├── house-price-prediction.ipynb ├── pima-indians-diabetes-database-svm-accuracy-79.ipynb └── winequality-prediction.ipynb /house-price-prediction.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "cells": [ 3 | { 4 | "cell_type": "code", 5 | "execution_count": 3, 6 | "id": "6dac32b6", 7 | "metadata": { 8 | "execution": { 9 | "iopub.execute_input": "2022-11-05T08:25:27.182542Z", 10 | "iopub.status.busy": "2022-11-05T08:25:27.182052Z", 11 | "iopub.status.idle": "2022-11-05T08:25:28.811001Z", 12 | "shell.execute_reply": "2022-11-05T08:25:28.809695Z" 13 | }, 14 | "papermill": { 15 | "duration": 1.645588, 16 | "end_time": "2022-11-05T08:25:28.814117", 17 | "exception": false, 18 | "start_time": "2022-11-05T08:25:27.168529", 19 | "status": "completed" 20 | }, 21 | "tags": [] 22 | }, 23 | "outputs": [], 24 | "source": [ 25 | "import pandas as pd \n", 26 | "import numpy as np \n", 27 | "import matplotlib.pyplot as plt\n", 28 | "import seaborn as sns\n", 29 | "from sklearn.preprocessing import LabelEncoder\n", 30 | "from sklearn.linear_model import LinearRegression\n", 31 | "from sklearn.ensemble import RandomForestRegressor\n", 32 | "from sklearn.model_selection import train_test_split \n", 33 | "from sklearn.metrics import mean_squared_error,mean_absolute_percentage_error" 34 | ] 35 | }, 36 | { 37 | "cell_type": "code", 38 | "execution_count": 4, 39 | "id": "c9020f95", 40 | "metadata": { 41 | "execution": { 42 | "iopub.execute_input": "2022-11-05T08:25:28.860843Z", 43 | "iopub.status.busy": "2022-11-05T08:25:28.859652Z", 44 | "iopub.status.idle": "2022-11-05T08:25:28.913453Z", 45 | "shell.execute_reply": "2022-11-05T08:25:28.912083Z" 46 | }, 47 | "papermill": { 48 | "duration": 0.069995, 49 | "end_time": "2022-11-05T08:25:28.916626", 50 | "exception": false, 51 | "start_time": "2022-11-05T08:25:28.846631", 52 | "status": "completed" 53 | }, 54 | "tags": [] 55 | }, 56 | "outputs": [], 57 | "source": [ 58 | "data =pd.read_csv(\"D:\\House pricece\\data.csv\")" 59 | ] 60 | }, 61 | { 62 | "cell_type": "code", 63 | "execution_count": 5, 64 | "id": "819a0220", 65 | "metadata": { 66 | "execution": { 67 | "iopub.execute_input": "2022-11-05T08:25:28.958510Z", 68 | "iopub.status.busy": "2022-11-05T08:25:28.958043Z", 69 | "iopub.status.idle": "2022-11-05T08:25:28.994409Z", 70 | "shell.execute_reply": "2022-11-05T08:25:28.993136Z" 71 | }, 72 | "papermill": { 73 | "duration": 0.051362, 74 | "end_time": "2022-11-05T08:25:28.997674", 75 | "exception": false, 76 | "start_time": "2022-11-05T08:25:28.946312", 77 | "status": "completed" 78 | }, 79 | "tags": [] 80 | }, 81 | "outputs": [ 82 | { 83 | "data": { 84 | "text/html": [ 85 | "
\n", 86 | "\n", 99 | "\n", 100 | " \n", 101 | " \n", 102 | " \n", 103 | " \n", 104 | " \n", 105 | " \n", 106 | " \n", 107 | " \n", 108 | " \n", 109 | " \n", 110 | " \n", 111 | " \n", 112 | " \n", 113 | " \n", 114 | " \n", 115 | " \n", 116 | " \n", 117 | " \n", 118 | " \n", 119 | " \n", 120 | " \n", 121 | " \n", 122 | " \n", 123 | " \n", 124 | " \n", 125 | " \n", 126 | " \n", 127 | " \n", 128 | " \n", 129 | " \n", 130 | " \n", 131 | " \n", 132 | " \n", 133 | " \n", 134 | " \n", 135 | " \n", 136 | " \n", 137 | " \n", 138 | " \n", 139 | " \n", 140 | " \n", 141 | " \n", 142 | " \n", 143 | " \n", 144 | " \n", 145 | " \n", 146 | " \n", 147 | " \n", 148 | " \n", 149 | " \n", 150 | " \n", 151 | " \n", 152 | " \n", 153 | " \n", 154 | " \n", 155 | " \n", 156 | " \n", 157 | " \n", 158 | " \n", 159 | " \n", 160 | " \n", 161 | " \n", 162 | " \n", 163 | " \n", 164 | " \n", 165 | " \n", 166 | " \n", 167 | " \n", 168 | " \n", 169 | " \n", 170 | " \n", 171 | " \n", 172 | " \n", 173 | " \n", 174 | " \n", 175 | " \n", 176 | " \n", 177 | " \n", 178 | " \n", 179 | " \n", 180 | " \n", 181 | " \n", 182 | " \n", 183 | " \n", 184 | " \n", 185 | " \n", 186 | " \n", 187 | " \n", 188 | " \n", 189 | " \n", 190 | " \n", 191 | " \n", 192 | " \n", 193 | " \n", 194 | "
pricebedroomsbathroomssqft_livingsqft_lotfloorswaterfrontviewconditionsqft_abovesqft_basementcity
0313000.03.01.50134079121.500313400Shoreline
12384000.05.02.50365090502.00453370280Seattle
2342000.03.02.001930119471.000419300Kent
3420000.03.02.25200080301.000410001000Bellevue
4550000.04.02.501940105001.00041140800Redmond
\n", 195 | "
" 196 | ], 197 | "text/plain": [ 198 | " price bedrooms bathrooms sqft_living sqft_lot floors waterfront \\\n", 199 | "0 313000.0 3.0 1.50 1340 7912 1.5 0 \n", 200 | "1 2384000.0 5.0 2.50 3650 9050 2.0 0 \n", 201 | "2 342000.0 3.0 2.00 1930 11947 1.0 0 \n", 202 | "3 420000.0 3.0 2.25 2000 8030 1.0 0 \n", 203 | "4 550000.0 4.0 2.50 1940 10500 1.0 0 \n", 204 | "\n", 205 | " view condition sqft_above sqft_basement city \n", 206 | "0 0 3 1340 0 Shoreline \n", 207 | "1 4 5 3370 280 Seattle \n", 208 | "2 0 4 1930 0 Kent \n", 209 | "3 0 4 1000 1000 Bellevue \n", 210 | "4 0 4 1140 800 Redmond " 211 | ] 212 | }, 213 | "execution_count": 5, 214 | "metadata": {}, 215 | "output_type": "execute_result" 216 | } 217 | ], 218 | "source": [ 219 | "\n", 220 | "data = data.drop(['date','country',\"street\",\"statezip\",\"yr_built\",\"yr_renovated\"],axis=1)\n", 221 | "data.head()" 222 | ] 223 | }, 224 | { 225 | "cell_type": "code", 226 | "execution_count": 6, 227 | "id": "87b54c71", 228 | "metadata": { 229 | "execution": { 230 | "iopub.execute_input": "2022-11-05T08:25:29.020509Z", 231 | "iopub.status.busy": "2022-11-05T08:25:29.019655Z", 232 | "iopub.status.idle": "2022-11-05T08:25:29.025233Z", 233 | "shell.execute_reply": "2022-11-05T08:25:29.023946Z" 234 | }, 235 | "papermill": { 236 | "duration": 0.01951, 237 | "end_time": "2022-11-05T08:25:29.027633", 238 | "exception": false, 239 | "start_time": "2022-11-05T08:25:29.008123", 240 | "status": "completed" 241 | }, 242 | "tags": [] 243 | }, 244 | "outputs": [], 245 | "source": [ 246 | "le = LabelEncoder()" 247 | ] 248 | }, 249 | { 250 | "cell_type": "code", 251 | "execution_count": 7, 252 | "id": "79e08a06", 253 | "metadata": { 254 | "execution": { 255 | "iopub.execute_input": "2022-11-05T08:25:29.050061Z", 256 | "iopub.status.busy": "2022-11-05T08:25:29.049622Z", 257 | "iopub.status.idle": "2022-11-05T08:25:29.058985Z", 258 | "shell.execute_reply": "2022-11-05T08:25:29.057952Z" 259 | }, 260 | "papermill": { 261 | "duration": 0.023815, 262 | "end_time": "2022-11-05T08:25:29.061671", 263 | "exception": false, 264 | "start_time": "2022-11-05T08:25:29.037856", 265 | "status": "completed" 266 | }, 267 | "tags": [] 268 | }, 269 | "outputs": [], 270 | "source": [ 271 | "data['city_new'] = le.fit_transform(data['city'])\n" 272 | ] 273 | }, 274 | { 275 | "cell_type": "code", 276 | "execution_count": 8, 277 | "id": "58495df7", 278 | "metadata": { 279 | "execution": { 280 | "iopub.execute_input": "2022-11-05T08:25:29.085329Z", 281 | "iopub.status.busy": "2022-11-05T08:25:29.084522Z", 282 | "iopub.status.idle": "2022-11-05T08:25:29.094941Z", 283 | "shell.execute_reply": "2022-11-05T08:25:29.093411Z" 284 | }, 285 | "papermill": { 286 | "duration": 0.026067, 287 | "end_time": "2022-11-05T08:25:29.098176", 288 | "exception": false, 289 | "start_time": "2022-11-05T08:25:29.072109", 290 | "status": "completed" 291 | }, 292 | "tags": [] 293 | }, 294 | "outputs": [], 295 | "source": [ 296 | "cols = ['bedrooms',\"bathrooms\",\"floors\",\"price\"]\n", 297 | "\n", 298 | "for col in cols :\n", 299 | " data[col] = data[col].astype(int)\n", 300 | "\n", 301 | "# Because how can 1.50 bathroom exists" 302 | ] 303 | }, 304 | { 305 | "cell_type": "code", 306 | "execution_count": 9, 307 | "id": "101ec19d", 308 | "metadata": { 309 | "execution": { 310 | "iopub.execute_input": "2022-11-05T08:25:29.120976Z", 311 | "iopub.status.busy": "2022-11-05T08:25:29.120502Z", 312 | "iopub.status.idle": "2022-11-05T08:25:29.136886Z", 313 | "shell.execute_reply": "2022-11-05T08:25:29.135439Z" 314 | }, 315 | "papermill": { 316 | "duration": 0.031037, 317 | "end_time": "2022-11-05T08:25:29.139498", 318 | "exception": false, 319 | "start_time": "2022-11-05T08:25:29.108461", 320 | "status": "completed" 321 | }, 322 | "tags": [] 323 | }, 324 | "outputs": [ 325 | { 326 | "data": { 327 | "text/html": [ 328 | "
\n", 329 | "\n", 342 | "\n", 343 | " \n", 344 | " \n", 345 | " \n", 346 | " \n", 347 | " \n", 348 | " \n", 349 | " \n", 350 | " \n", 351 | " \n", 352 | " \n", 353 | " \n", 354 | " \n", 355 | " \n", 356 | " \n", 357 | " \n", 358 | " \n", 359 | " \n", 360 | " \n", 361 | " \n", 362 | " \n", 363 | " \n", 364 | " \n", 365 | " \n", 366 | " \n", 367 | " \n", 368 | " \n", 369 | " \n", 370 | " \n", 371 | " \n", 372 | " \n", 373 | " \n", 374 | " \n", 375 | " \n", 376 | " \n", 377 | " \n", 378 | " \n", 379 | " \n", 380 | " \n", 381 | " \n", 382 | " \n", 383 | " \n", 384 | " \n", 385 | " \n", 386 | " \n", 387 | " \n", 388 | " \n", 389 | " \n", 390 | " \n", 391 | " \n", 392 | " \n", 393 | " \n", 394 | " \n", 395 | " \n", 396 | " \n", 397 | " \n", 398 | " \n", 399 | " \n", 400 | " \n", 401 | " \n", 402 | " \n", 403 | " \n", 404 | " \n", 405 | " \n", 406 | " \n", 407 | " \n", 408 | " \n", 409 | " \n", 410 | " \n", 411 | " \n", 412 | " \n", 413 | " \n", 414 | " \n", 415 | " \n", 416 | " \n", 417 | " \n", 418 | " \n", 419 | " \n", 420 | " \n", 421 | " \n", 422 | " \n", 423 | " \n", 424 | " \n", 425 | " \n", 426 | " \n", 427 | " \n", 428 | " \n", 429 | " \n", 430 | " \n", 431 | " \n", 432 | " \n", 433 | " \n", 434 | " \n", 435 | " \n", 436 | " \n", 437 | " \n", 438 | " \n", 439 | " \n", 440 | " \n", 441 | " \n", 442 | " \n", 443 | "
pricebedroomsbathroomssqft_livingsqft_lotfloorswaterfrontviewconditionsqft_abovesqft_basementcitycity_new
03130003113407912100313400Shoreline36
12384000523650905020453370280Seattle35
234200032193011947100419300Kent18
34200003220008030100410001000Bellevue3
45500004219401050010041140800Redmond31
\n", 444 | "
" 445 | ], 446 | "text/plain": [ 447 | " price bedrooms bathrooms sqft_living sqft_lot floors waterfront \\\n", 448 | "0 313000 3 1 1340 7912 1 0 \n", 449 | "1 2384000 5 2 3650 9050 2 0 \n", 450 | "2 342000 3 2 1930 11947 1 0 \n", 451 | "3 420000 3 2 2000 8030 1 0 \n", 452 | "4 550000 4 2 1940 10500 1 0 \n", 453 | "\n", 454 | " view condition sqft_above sqft_basement city city_new \n", 455 | "0 0 3 1340 0 Shoreline 36 \n", 456 | "1 4 5 3370 280 Seattle 35 \n", 457 | "2 0 4 1930 0 Kent 18 \n", 458 | "3 0 4 1000 1000 Bellevue 3 \n", 459 | "4 0 4 1140 800 Redmond 31 " 460 | ] 461 | }, 462 | "execution_count": 9, 463 | "metadata": {}, 464 | "output_type": "execute_result" 465 | } 466 | ], 467 | "source": [ 468 | "data.head()" 469 | ] 470 | }, 471 | { 472 | "cell_type": "code", 473 | "execution_count": 10, 474 | "id": "ea52dc4b", 475 | "metadata": { 476 | "execution": { 477 | "iopub.execute_input": "2022-11-05T08:25:29.479804Z", 478 | "iopub.status.busy": "2022-11-05T08:25:29.478912Z", 479 | "iopub.status.idle": "2022-11-05T08:25:29.695123Z", 480 | "shell.execute_reply": "2022-11-05T08:25:29.693698Z" 481 | }, 482 | "papermill": { 483 | "duration": 0.231745, 484 | "end_time": "2022-11-05T08:25:29.698138", 485 | "exception": false, 486 | "start_time": "2022-11-05T08:25:29.466393", 487 | "status": "completed" 488 | }, 489 | "tags": [] 490 | }, 491 | "outputs": [ 492 | { 493 | "data": { 494 | "text/plain": [ 495 | "" 496 | ] 497 | }, 498 | "execution_count": 10, 499 | "metadata": {}, 500 | "output_type": "execute_result" 501 | }, 502 | { 503 | "data": { 504 | "image/png": "", 505 | "text/plain": [ 506 | "
" 507 | ] 508 | }, 509 | "metadata": {}, 510 | "output_type": "display_data" 511 | } 512 | ], 513 | "source": [ 514 | "sns.countplot(data=data,x=data['condition'])" 515 | ] 516 | }, 517 | { 518 | "cell_type": "code", 519 | "execution_count": 11, 520 | "id": "41e4d100", 521 | "metadata": { 522 | "execution": { 523 | "iopub.execute_input": "2022-11-05T08:25:30.328068Z", 524 | "iopub.status.busy": "2022-11-05T08:25:30.327436Z", 525 | "iopub.status.idle": "2022-11-05T08:25:30.337400Z", 526 | "shell.execute_reply": "2022-11-05T08:25:30.336508Z" 527 | }, 528 | "papermill": { 529 | "duration": 0.025507, 530 | "end_time": "2022-11-05T08:25:30.339545", 531 | "exception": false, 532 | "start_time": "2022-11-05T08:25:30.314038", 533 | "status": "completed" 534 | }, 535 | "tags": [] 536 | }, 537 | "outputs": [ 538 | { 539 | "data": { 540 | "text/plain": [ 541 | "city\n", 542 | "Seattle 1573\n", 543 | "Renton 293\n", 544 | "Bellevue 286\n", 545 | "Redmond 235\n", 546 | "Issaquah 187\n", 547 | "Kirkland 187\n", 548 | "Kent 185\n", 549 | "Auburn 176\n", 550 | "Sammamish 175\n", 551 | "Federal Way 148\n", 552 | "Shoreline 123\n", 553 | "Woodinville 115\n", 554 | "Maple Valley 96\n", 555 | "Mercer Island 86\n", 556 | "Burien 74\n", 557 | "Snoqualmie 71\n", 558 | "Kenmore 66\n", 559 | "Des Moines 58\n", 560 | "North Bend 50\n", 561 | "Covington 43\n", 562 | "Duvall 42\n", 563 | "Lake Forest Park 36\n", 564 | "Bothell 33\n", 565 | "Newcastle 33\n", 566 | "SeaTac 29\n", 567 | "Tukwila 29\n", 568 | "Vashon 29\n", 569 | "Enumclaw 28\n", 570 | "Carnation 22\n", 571 | "Normandy Park 18\n", 572 | "Clyde Hill 11\n", 573 | "Medina 11\n", 574 | "Fall City 11\n", 575 | "Black Diamond 9\n", 576 | "Ravensdale 7\n", 577 | "Pacific 6\n", 578 | "Algona 5\n", 579 | "Yarrow Point 4\n", 580 | "Skykomish 3\n", 581 | "Preston 2\n", 582 | "Milton 2\n", 583 | "Inglewood-Finn Hill 1\n", 584 | "Snoqualmie Pass 1\n", 585 | "Beaux Arts Village 1\n", 586 | "Name: count, dtype: int64" 587 | ] 588 | }, 589 | "execution_count": 11, 590 | "metadata": {}, 591 | "output_type": "execute_result" 592 | } 593 | ], 594 | "source": [ 595 | "data['city'].value_counts()" 596 | ] 597 | }, 598 | { 599 | "cell_type": "code", 600 | "execution_count": 12, 601 | "id": "8f160844", 602 | "metadata": { 603 | "execution": { 604 | "iopub.execute_input": "2022-11-05T08:25:30.365700Z", 605 | "iopub.status.busy": "2022-11-05T08:25:30.365038Z", 606 | "iopub.status.idle": "2022-11-05T08:25:30.602652Z", 607 | "shell.execute_reply": "2022-11-05T08:25:30.601799Z" 608 | }, 609 | "papermill": { 610 | "duration": 0.253522, 611 | "end_time": "2022-11-05T08:25:30.605014", 612 | "exception": false, 613 | "start_time": "2022-11-05T08:25:30.351492", 614 | "status": "completed" 615 | }, 616 | "tags": [] 617 | }, 618 | "outputs": [ 619 | { 620 | "data": { 621 | "text/plain": [ 622 | "" 623 | ] 624 | }, 625 | "execution_count": 12, 626 | "metadata": {}, 627 | "output_type": "execute_result" 628 | }, 629 | { 630 | "data": { 631 | "image/png": "", 632 | "text/plain": [ 633 | "
" 634 | ] 635 | }, 636 | "metadata": {}, 637 | "output_type": "display_data" 638 | } 639 | ], 640 | "source": [ 641 | "data['price'].plot(title='price Range')" 642 | ] 643 | }, 644 | { 645 | "cell_type": "code", 646 | "execution_count": 13, 647 | "id": "a67df3de", 648 | "metadata": { 649 | "execution": { 650 | "iopub.execute_input": "2022-11-05T08:25:30.632224Z", 651 | "iopub.status.busy": "2022-11-05T08:25:30.631444Z", 652 | "iopub.status.idle": "2022-11-05T08:25:30.638410Z", 653 | "shell.execute_reply": "2022-11-05T08:25:30.637266Z" 654 | }, 655 | "papermill": { 656 | "duration": 0.023171, 657 | "end_time": "2022-11-05T08:25:30.640841", 658 | "exception": false, 659 | "start_time": "2022-11-05T08:25:30.617670", 660 | "status": "completed" 661 | }, 662 | "tags": [] 663 | }, 664 | "outputs": [ 665 | { 666 | "data": { 667 | "text/plain": [ 668 | "551962.9754347826" 669 | ] 670 | }, 671 | "execution_count": 13, 672 | "metadata": {}, 673 | "output_type": "execute_result" 674 | } 675 | ], 676 | "source": [ 677 | "np.mean(data['price'])" 678 | ] 679 | }, 680 | { 681 | "cell_type": "code", 682 | "execution_count": 14, 683 | "id": "e93dadf9", 684 | "metadata": { 685 | "execution": { 686 | "iopub.execute_input": "2022-11-05T08:25:30.667111Z", 687 | "iopub.status.busy": "2022-11-05T08:25:30.666605Z", 688 | "iopub.status.idle": "2022-11-05T08:25:30.861896Z", 689 | "shell.execute_reply": "2022-11-05T08:25:30.860676Z" 690 | }, 691 | "papermill": { 692 | "duration": 0.21127, 693 | "end_time": "2022-11-05T08:25:30.864446", 694 | "exception": false, 695 | "start_time": "2022-11-05T08:25:30.653176", 696 | "status": "completed" 697 | }, 698 | "tags": [] 699 | }, 700 | "outputs": [ 701 | { 702 | "data": { 703 | "text/plain": [ 704 | "" 705 | ] 706 | }, 707 | "execution_count": 14, 708 | "metadata": {}, 709 | "output_type": "execute_result" 710 | }, 711 | { 712 | "data": { 713 | "image/png": "iVBORw0KGgoAAAANSUhEUgAAAkQAAAGwCAYAAABIC3rIAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjcuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8pXeV/AAAACXBIWXMAAA9hAAAPYQGoP6dpAAAlFklEQVR4nO3df3BU9b3/8dcmkCVIdmOEZJMSIooC4ZfXQHEvmuHXTUB0ZEpVlArUFEZvQgdjIc1cifzovbkFwV9F0PZidC5cwVoQgw3EIOGKATW3KT/EDHDphA5soECyECEJyd4/+uV8XYOoIcnZ8Hk+ZnaGc84nZ9+nk5Znd88ujkAgEBAAAIDBwuweAAAAwG4EEQAAMB5BBAAAjEcQAQAA4xFEAADAeAQRAAAwHkEEAACM18XuATqD5uZmHT9+XFFRUXI4HHaPAwAAvoNAIKBz584pISFBYWFXfw2IIPoOjh8/rsTERLvHAAAArXDs2DH17t37qmsIou8gKipK0t//A3W5XDZPAwAAvgu/36/ExETr7/GrIYi+g8tvk7lcLoIIAIBO5rvc7sJN1QAAwHgEEQAAMB5BBAAAjEcQAQAA4xFEAADAeAQRAAAwHkEEAACMRxABAADjEUQAAMB4BBEAADAeQQQAAIxHEAEAAOMRRAAAwHgEEQAAMB5BBAAAjNfF7gFMkjLvTbtHQAgpXzbd7hEAAP8PrxABAADjEUQAAMB4BBEAADAeQQQAAIxHEAEAAOMRRAAAwHgEEQAAMB5BBAAAjEcQAQAA4xFEAADAeAQRAAAwnq1BlJ+frxEjRigqKkqxsbGaPHmyKisrg9aMHj1aDocj6PHEE08EramqqtKkSZPUvXt3xcbGat68ebp06VLQmh07dujOO++U0+lUv379VFBQ0N6XBwAAOglbg6i0tFSZmZnavXu3iouL1djYqLS0NNXV1QWtmzVrlk6cOGE9li5dah1ramrSpEmT1NDQoI8//lhvvPGGCgoKlJeXZ605evSoJk2apDFjxqiiokJz587Vz372M23durXDrhUAAIQuW/+1+6KioqDtgoICxcbGqry8XKmpqdb+7t27y+PxXPEc27Zt0+eff64PPvhAcXFxuuOOO7RkyRLl5ORo4cKFioiI0OrVq9W3b18tX75ckjRw4EB99NFHev7555Went5+FwgAADqFkLqHqLa2VpIUExMTtH/t2rXq2bOnBg8erNzcXH355ZfWsbKyMg0ZMkRxcXHWvvT0dPn9fh04cMBaM378+KBzpqenq6ys7Ipz1NfXy+/3Bz0AAMD1y9ZXiL6qublZc+fO1ahRozR48GBr/6OPPqqkpCQlJCRo7969ysnJUWVlpf7whz9Iknw+X1AMSbK2fT7fVdf4/X5duHBBkZGRQcfy8/O1aNGiNr9GAAAQmkImiDIzM7V//3599NFHQftnz55t/XnIkCGKj4/XuHHjdOTIEd16663tMktubq6ys7Otbb/fr8TExHZ5LgAAYL+QeMssKytLhYWF+vDDD9W7d++rrh05cqQk6fDhw5Ikj8ej6urqoDWXty/fd/RNa1wuV4tXhyTJ6XTK5XIFPQAAwPXL1iAKBALKysrSxo0btX37dvXt2/dbf6aiokKSFB8fL0nyer3at2+fTp48aa0pLi6Wy+VScnKytaakpCToPMXFxfJ6vW10JQAAoDOzNYgyMzP1n//5n1q3bp2ioqLk8/nk8/l04cIFSdKRI0e0ZMkSlZeX6y9/+Ys2b96s6dOnKzU1VUOHDpUkpaWlKTk5WY899pj+/Oc/a+vWrXrmmWeUmZkpp9MpSXriiSf0v//7v5o/f76++OILvfLKK9qwYYOeeuop264dAACEDluDaNWqVaqtrdXo0aMVHx9vPdavXy9JioiI0AcffKC0tDQNGDBATz/9tKZMmaL33nvPOkd4eLgKCwsVHh4ur9ern/zkJ5o+fboWL15srenbt6+2bNmi4uJiDRs2TMuXL9fvfvc7PnIPAAAkSY5AIBCwe4hQ5/f75Xa7VVtbe033E6XMe7MNp0JnV75sut0jAMB17fv8/R0SN1UDAADYiSACAADGI4gAAIDxCCIAAGA8gggAABiPIAIAAMYjiAAAgPEIIgAAYDyCCAAAGI8gAgAAxiOIAACA8QgiAABgPIIIAAAYjyACAADGI4gAAIDxCCIAAGA8gggAABiPIAIAAMYjiAAAgPEIIgAAYDyCCAAAGI8gAgAAxiOIAACA8QgiAABgPIIIAAAYjyACAADGI4gAAIDxCCIAAGA8gggAABiPIAIAAMYjiAAAgPEIIgAAYDyCCAAAGI8gAgAAxiOIAACA8QgiAABgPIIIAAAYjyACAADGI4gAAIDxCCIAAGA8gggAABiPIAIAAMYjiAAAgPEIIgAAYDyCCAAAGI8gAgAAxiOIAACA8QgiAABgPIIIAAAYjyACAADGI4gAAIDxCCIAAGA8gggAABiPIAIAAMYjiAAAgPEIIgAAYDxbgyg/P18jRoxQVFSUYmNjNXnyZFVWVgatuXjxojIzM3XTTTepR48emjJliqqrq4PWVFVVadKkSerevbtiY2M1b948Xbp0KWjNjh07dOedd8rpdKpfv34qKCho78sDAACdhK1BVFpaqszMTO3evVvFxcVqbGxUWlqa6urqrDVPPfWU3nvvPb399tsqLS3V8ePH9aMf/cg63tTUpEmTJqmhoUEff/yx3njjDRUUFCgvL89ac/ToUU2aNEljxoxRRUWF5s6dq5/97GfaunVrh14vAAAITY5AIBCwe4jLTp06pdjYWJWWlio1NVW1tbXq1auX1q1bpx//+MeSpC+++EIDBw5UWVmZ7rrrLv3xj3/Ufffdp+PHjysuLk6StHr1auXk5OjUqVOKiIhQTk6OtmzZov3791vPNXXqVNXU1KioqOhb5/L7/XK73aqtrZXL5Wr19aXMe7PVP4vrT/my6XaPAADXte/z93dI3UNUW1srSYqJiZEklZeXq7GxUePHj7fWDBgwQH369FFZWZkkqaysTEOGDLFiSJLS09Pl9/t14MABa81Xz3F5zeVzfF19fb38fn/QAwAAXL9CJoiam5s1d+5cjRo1SoMHD5Yk+Xw+RUREKDo6OmhtXFycfD6ftearMXT5+OVjV1vj9/t14cKFFrPk5+fL7XZbj8TExDa5RgAAEJpCJogyMzO1f/9+vfXWW3aPotzcXNXW1lqPY8eO2T0SAABoR13sHkCSsrKyVFhYqJ07d6p3797Wfo/Ho4aGBtXU1AS9SlRdXS2Px2Ot+eSTT4LOd/lTaF9d8/VPplVXV8vlcikyMrLFPE6nU06ns02uDQAAhD5bXyEKBALKysrSxo0btX37dvXt2zfoeEpKirp27aqSkhJrX2VlpaqqquT1eiVJXq9X+/bt08mTJ601xcXFcrlcSk5OttZ89RyX11w+BwAAMJutrxBlZmZq3bp1evfddxUVFWXd8+N2uxUZGSm3262MjAxlZ2crJiZGLpdLc+bMkdfr1V133SVJSktLU3Jysh577DEtXbpUPp9PzzzzjDIzM61XeZ544gn95je/0fz58/X4449r+/bt2rBhg7Zs2WLbtQMAgNBh6ytEq1atUm1trUaPHq34+HjrsX79emvN888/r/vuu09TpkxRamqqPB6P/vCHP1jHw8PDVVhYqPDwcHm9Xv3kJz/R9OnTtXjxYmtN3759tWXLFhUXF2vYsGFavny5fve73yk9Pb1DrxcAAISmkPoeolDF9xChPfA9RADQvjrt9xABAADYgSACAADGI4gAAIDxCCIAAGA8gggAABiPIAIAAMYjiAAAgPEIIgAAYDyCCAAAGI8gAgAAxiOIAACA8QgiAABgPIIIAAAYr4vdAwCwT9XiIXaPgBDTJ2+f3SMAtuAVIgAAYDyCCAAAGI8gAgAAxiOIAACA8QgiAABgPIIIAAAYjyACAADGI4gAAIDxCCIAAGA8gggAABiPIAIAAMYjiAAAgPEIIgAAYDyCCAAAGI8gAgAAxiOIAACA8QgiAABgPIIIAAAYjyACAADGI4gAAIDxCCIAAGA8gggAABiPIAIAAMYjiAAAgPEIIgAAYDyCCAAAGI8gAgAAxiOIAACA8QgiAABgPIIIAAAYjyACAADGI4gAAIDxCCIAAGA8gggAABiPIAIAAMYjiAAAgPEIIgAAYDyCCAAAGI8gAgAAxiOIAACA8QgiAABgPIIIAAAYz9Yg2rlzp+6//34lJCTI4XBo06ZNQcdnzpwph8MR9JgwYULQmjNnzmjatGlyuVyKjo5WRkaGzp8/H7Rm7969uueee9StWzclJiZq6dKl7X1pAACgE7E1iOrq6jRs2DCtXLnyG9dMmDBBJ06csB7/9V//FXR82rRpOnDggIqLi1VYWKidO3dq9uzZ1nG/36+0tDQlJSWpvLxcy5Yt08KFC/Xaa6+123UBAIDOpYudTz5x4kRNnDjxqmucTqc8Hs8Vjx08eFBFRUX69NNPNXz4cEnSyy+/rHvvvVfPPfecEhIStHbtWjU0NGjNmjWKiIjQoEGDVFFRoRUrVgSFEwAAMFfI30O0Y8cOxcbGqn///nryySd1+vRp61hZWZmio6OtGJKk8ePHKywsTHv27LHWpKamKiIiwlqTnp6uyspKnT179orPWV9fL7/fH/QAAADXr1YF0dixY1VTU9Niv9/v19ixY691JsuECRP05ptvqqSkRL/+9a9VWlqqiRMnqqmpSZLk8/kUGxsb9DNdunRRTEyMfD6ftSYuLi5ozeXty2u+Lj8/X26323okJia22TUBAIDQ06q3zHbs2KGGhoYW+y9evKj//u//vuahLps6dar15yFDhmjo0KG69dZbtWPHDo0bN67NnufrcnNzlZ2dbW37/X6iCACA69j3CqK9e/daf/7888+DXmFpampSUVGRfvCDH7TddF9zyy23qGfPnjp8+LDGjRsnj8ejkydPBq25dOmSzpw5Y9135PF4VF1dHbTm8vY33ZvkdDrldDrb4QoAAEAo+l5BdMcdd1gff7/SW2ORkZF6+eWX22y4r/vrX/+q06dPKz4+XpLk9XpVU1Oj8vJypaSkSJK2b9+u5uZmjRw50lrzL//yL2psbFTXrl0lScXFxerfv79uvPHGdpsVAAB0Ht8riI4ePapAIKBbbrlFn3zyiXr16mUdi4iIUGxsrMLDw7/z+c6fP6/Dhw8Hnb+iokIxMTGKiYnRokWLNGXKFHk8Hh05ckTz589Xv379lJ6eLkkaOHCgJkyYoFmzZmn16tVqbGxUVlaWpk6dqoSEBEnSo48+qkWLFikjI0M5OTnav3+/XnzxRT3//PPf59IBAMB17HsFUVJSkiSpubm5TZ78s88+05gxY6zty/ftzJgxQ6tWrdLevXv1xhtvqKamRgkJCUpLS9OSJUuC3s5au3atsrKyNG7cOIWFhWnKlCl66aWXrONut1vbtm1TZmamUlJS1LNnT+Xl5fGRewAAYGn19xAdOnRIH374oU6ePNkikPLy8r7TOUaPHq1AIPCNx7du3fqt54iJidG6deuuumbo0KFterM3AAC4vrQqiH7729/qySefVM+ePeXxeORwOKxjDofjOwcRAABAKGhVEP3qV7/Sv/7rvyonJ6et5wEAAOhwrfpixrNnz+rBBx9s61kAAABs0aogevDBB7Vt27a2ngUAAMAWrXrLrF+/flqwYIF2796tIUOGWN/vc9nPf/7zNhkOAACgI7QqiF577TX16NFDpaWlKi0tDTrmcDgIIgAA0Km0KoiOHj3a1nMAAADYplX3EAEAAFxPWvUK0eOPP37V42vWrGnVMAAAAHZoVRCdPXs2aLuxsVH79+9XTU3NFf/RVwAAgFDWqiDauHFji33Nzc168skndeutt17zUAAAAB2pze4hCgsLU3Z2Nv+KPAAA6HTa9KbqI0eO6NKlS215SgAAgHbXqrfMsrOzg7YDgYBOnDihLVu2aMaMGW0yGAAAQEdpVRD96U9/CtoOCwtTr169tHz58m/9BBoAAECoaVUQffjhh209BwAAgG1aFUSXnTp1SpWVlZKk/v37q1evXm0yFAAAQEdq1U3VdXV1evzxxxUfH6/U1FSlpqYqISFBGRkZ+vLLL9t6RgAAgHbVqiDKzs5WaWmp3nvvPdXU1KimpkbvvvuuSktL9fTTT7f1jAAAAO2qVW+ZvfPOO/r973+v0aNHW/vuvfdeRUZG6qGHHtKqVavaaj4AAIB216pXiL788kvFxcW12B8bG8tbZgAAoNNpVRB5vV49++yzunjxorXvwoULWrRokbxeb5sNBwAA0BFa9ZbZCy+8oAkTJqh3794aNmyYJOnPf/6znE6ntm3b1qYDAgAAtLdWBdGQIUN06NAhrV27Vl988YUk6ZFHHtG0adMUGRnZpgMCAAC0t1YFUX5+vuLi4jRr1qyg/WvWrNGpU6eUk5PTJsMBAAB0hFbdQ/Tqq69qwIABLfYPGjRIq1evvuahAAAAOlKrgsjn8yk+Pr7F/l69eunEiRPXPBQAAEBHalUQJSYmateuXS3279q1SwkJCdc8FAAAQEdq1T1Es2bN0ty5c9XY2KixY8dKkkpKSjR//ny+qRoAAHQ6rQqiefPm6fTp0/rnf/5nNTQ0SJK6deumnJwc5ebmtumAAAAA7a1VQeRwOPTrX/9aCxYs0MGDBxUZGanbbrtNTqezrecDAABod60Kost69OihESNGtNUsAAAAtmjVTdUAAADXE4IIAAAYjyACAADGI4gAAIDxCCIAAGA8gggAABiPIAIAAMYjiAAAgPEIIgAAYDyCCAAAGI8gAgAAxiOIAACA8QgiAABgPIIIAAAYjyACAADGI4gAAIDxCCIAAGA8gggAABiPIAIAAMYjiAAAgPEIIgAAYDyCCAAAGI8gAgAAxiOIAACA8QgiAABgPFuDaOfOnbr//vuVkJAgh8OhTZs2BR0PBALKy8tTfHy8IiMjNX78eB06dChozZkzZzRt2jS5XC5FR0crIyND58+fD1qzd+9e3XPPPerWrZsSExO1dOnS9r40AADQidgaRHV1dRo2bJhWrlx5xeNLly7VSy+9pNWrV2vPnj264YYblJ6erosXL1prpk2bpgMHDqi4uFiFhYXauXOnZs+ebR33+/1KS0tTUlKSysvLtWzZMi1cuFCvvfZau18fAADoHLrY+eQTJ07UxIkTr3gsEAjohRde0DPPPKMHHnhAkvTmm28qLi5OmzZt0tSpU3Xw4EEVFRXp008/1fDhwyVJL7/8su69914999xzSkhI0Nq1a9XQ0KA1a9YoIiJCgwYNUkVFhVasWBEUTl9VX1+v+vp6a9vv97fxlQMAgFASsvcQHT16VD6fT+PHj7f2ud1ujRw5UmVlZZKksrIyRUdHWzEkSePHj1dYWJj27NljrUlNTVVERIS1Jj09XZWVlTp79uwVnzs/P19ut9t6JCYmtsclAgCAEBGyQeTz+SRJcXFxQfvj4uKsYz6fT7GxsUHHu3TpopiYmKA1VzrHV5/j63Jzc1VbW2s9jh07du0XBAAAQpatb5mFKqfTKafTafcYAACgg4TsK0Qej0eSVF1dHbS/urraOubxeHTy5Mmg45cuXdKZM2eC1lzpHF99DgAAYLaQDaK+ffvK4/GopKTE2uf3+7Vnzx55vV5JktfrVU1NjcrLy60127dvV3Nzs0aOHGmt2blzpxobG601xcXF6t+/v2688cYOuhoAABDKbA2i8+fPq6KiQhUVFZL+fiN1RUWFqqqq5HA4NHfuXP3qV7/S5s2btW/fPk2fPl0JCQmaPHmyJGngwIGaMGGCZs2apU8++US7du1SVlaWpk6dqoSEBEnSo48+qoiICGVkZOjAgQNav369XnzxRWVnZ9t01QAAINTYeg/RZ599pjFjxljblyNlxowZKigo0Pz581VXV6fZs2erpqZGd999t4qKitStWzfrZ9auXausrCyNGzdOYWFhmjJlil566SXruNvt1rZt25SZmamUlBT17NlTeXl53/iRewAAYB5HIBAI2D1EqPP7/XK73aqtrZXL5Wr1eVLmvdmGU6GzK1823e4RVLV4iN0jIMT0ydtn9whAm/k+f3+H7D1EAAAAHYUgAgAAxiOIAACA8QgiAABgPIIIAAAYjyACAADGI4gAAIDxCCIAAGA8gggAABiPIAIAAMYjiAAAgPEIIgAAYDyCCAAAGI8gAgAAxiOIAACA8QgiAABgPIIIAAAYjyACAADGI4gAAIDxCCIAAGA8gggAABiPIAIAAMYjiAAAgPEIIgAAYDyCCAAAGI8gAgAAxiOIAACA8QgiAABgPIIIAAAYjyACAADGI4gAAIDxCCIAAGA8gggAABiPIAIAAMYjiAAAgPEIIgAAYDyCCAAAGI8gAgAAxiOIAACA8QgiAABgPIIIAAAYjyACAADGI4gAAIDxCCIAAGA8gggAABiPIAIAAMYjiAAAgPEIIgAAYDyCCAAAGI8gAgAAxiOIAACA8QgiAABgPIIIAAAYjyACAADGI4gAAIDxCCIAAGC8kA6ihQsXyuFwBD0GDBhgHb948aIyMzN10003qUePHpoyZYqqq6uDzlFVVaVJkyape/fuio2N1bx583Tp0qWOvhQAABDCutg9wLcZNGiQPvjgA2u7S5f/P/JTTz2lLVu26O2335bb7VZWVpZ+9KMfadeuXZKkpqYmTZo0SR6PRx9//LFOnDih6dOnq2vXrvq3f/u3Dr8WAAAQmkI+iLp06SKPx9Nif21trf7jP/5D69at09ixYyVJr7/+ugYOHKjdu3frrrvu0rZt2/T555/rgw8+UFxcnO644w4tWbJEOTk5WrhwoSIiIq74nPX19aqvr7e2/X5/+1wcAAAICSH9lpkkHTp0SAkJCbrllls0bdo0VVVVSZLKy8vV2Nio8ePHW2sHDBigPn36qKysTJJUVlamIUOGKC4uzlqTnp4uv9+vAwcOfONz5ufny+12W4/ExMR2ujoAABAKQjqIRo4cqYKCAhUVFWnVqlU6evSo7rnnHp07d04+n08RERGKjo4O+pm4uDj5fD5Jks/nC4qhy8cvH/smubm5qq2ttR7Hjh1r2wsDAAAhJaTfMps4caL156FDh2rkyJFKSkrShg0bFBkZ2W7P63Q65XQ62+38AAAgtIT0K0RfFx0drdtvv12HDx+Wx+NRQ0ODampqgtZUV1db9xx5PJ4Wnzq7vH2l+5IAAICZOlUQnT9/XkeOHFF8fLxSUlLUtWtXlZSUWMcrKytVVVUlr9crSfJ6vdq3b59OnjxprSkuLpbL5VJycnKHzw8AAEJTSL9l9otf/EL333+/kpKSdPz4cT377LMKDw/XI488IrfbrYyMDGVnZysmJkYul0tz5syR1+vVXXfdJUlKS0tTcnKyHnvsMS1dulQ+n0/PPPOMMjMzeUsMAABYQjqI/vrXv+qRRx7R6dOn1atXL919993avXu3evXqJUl6/vnnFRYWpilTpqi+vl7p6el65ZVXrJ8PDw9XYWGhnnzySXm9Xt1www2aMWOGFi9ebNclAQCAEBTSQfTWW29d9Xi3bt20cuVKrVy58hvXJCUl6f3332/r0QAAwHWkU91DBAAA0B4IIgAAYDyCCAAAGI8gAgAAxiOIAACA8QgiAABgPIIIAAAYjyACAADGI4gAAIDxCCIAAGA8gggAABiPIAIAAMYjiAAAgPEIIgAAYDyCCAAAGI8gAgAAxiOIAACA8QgiAABgPIIIAAAYjyACAADGI4gAAIDxCCIAAGA8gggAABiPIAIAAMYjiAAAgPEIIgAAYDyCCAAAGI8gAgAAxiOIAACA8QgiAABgPIIIAAAYjyACAADGI4gAAIDxCCIAAGA8gggAABiPIAIAAMYjiAAAgPEIIgAAYDyCCAAAGI8gAgAAxiOIAACA8QgiAABgvC52DwAAwFeNenmU3SMghOyas6tDnodXiAAAgPEIIgAAYDyCCAAAGI8gAgAAxiOIAACA8QgiAABgPIIIAAAYjyACAADGI4gAAIDxCCIAAGA8gggAABiPIAIAAMYjiAAAgPGMCqKVK1fq5ptvVrdu3TRy5Eh98skndo8EAABCgDFBtH79emVnZ+vZZ5/V//zP/2jYsGFKT0/XyZMn7R4NAADYzJggWrFihWbNmqWf/vSnSk5O1urVq9W9e3etWbPG7tEAAIDNutg9QEdoaGhQeXm5cnNzrX1hYWEaP368ysrKWqyvr69XfX29tV1bWytJ8vv91zRHU/2Fa/p5XF+u9fepLZy72GT3CAgxofB7eenCJbtHQAi5lt/Jyz8bCAS+da0RQfS3v/1NTU1NiouLC9ofFxenL774osX6/Px8LVq0qMX+xMTEdpsR5nG//ITdIwAt5bvtngAI4s659t/Jc+fOye2++nmMCKLvKzc3V9nZ2dZ2c3Ozzpw5o5tuukkOh8PGyTo/v9+vxMREHTt2TC6Xy+5xAH4nEZL4vWwbgUBA586dU0JCwreuNSKIevbsqfDwcFVXVwftr66ulsfjabHe6XTK6XQG7YuOjm7PEY3jcrn4LzlCCr+TCEX8Xl67b3tl6DIjbqqOiIhQSkqKSkpKrH3Nzc0qKSmR1+u1cTIAABAKjHiFSJKys7M1Y8YMDR8+XD/84Q/1wgsvqK6uTj/96U/tHg0AANjMmCB6+OGHderUKeXl5cnn8+mOO+5QUVFRixut0b6cTqeeffbZFm9JAnbhdxKhiN/LjucIfJfPogEAAFzHjLiHCAAA4GoIIgAAYDyCCAAAGI8gAgAAxiOI0CF27typ+++/XwkJCXI4HNq0aZPdI8Fw+fn5GjFihKKiohQbG6vJkyersrLS7rFgsFWrVmno0KHWlzF6vV798Y9/tHssYxBE6BB1dXUaNmyYVq5cafcogCSptLRUmZmZ2r17t4qLi9XY2Ki0tDTV1dXZPRoM1bt3b/37v/+7ysvL9dlnn2ns2LF64IEHdODAAbtHMwIfu0eHczgc2rhxoyZPnmz3KIDl1KlTio2NVWlpqVJTU+0eB5AkxcTEaNmyZcrIyLB7lOueMV/MCABXU1tbK+nvfwEBdmtqatLbb7+turo6/ompDkIQATBec3Oz5s6dq1GjRmnw4MF2jwOD7du3T16vVxcvXlSPHj20ceNGJScn2z2WEQgiAMbLzMzU/v379dFHH9k9CgzXv39/VVRUqLa2Vr///e81Y8YMlZaWEkUdgCACYLSsrCwVFhZq586d6t27t93jwHARERHq16+fJCklJUWffvqpXnzxRb366qs2T3b9I4gAGCkQCGjOnDnauHGjduzYob59+9o9EtBCc3Oz6uvr7R7DCAQROsT58+d1+PBha/vo0aOqqKhQTEyM+vTpY+NkMFVmZqbWrVund999V1FRUfL5fJIkt9utyMhIm6eDiXJzczVx4kT16dNH586d07p167Rjxw5t3brV7tGMwMfu0SF27NihMWPGtNg/Y8YMFRQUdPxAMJ7D4bji/tdff10zZ87s2GEASRkZGSopKdGJEyfkdrs1dOhQ5eTk6J/+6Z/sHs0IBBEAADAe31QNAACMRxABAADjEUQAAMB4BBEAADAeQQQAAIxHEAEAAOMRRAAAwHgEEQAAMB5BBKDTCgQCmj17tmJiYuRwOBQdHa25c+faPRaAToggAtBpFRUVqaCgQIWFhTpx4oQGDx5s90gAOin+cVcAndaRI0cUHx+vf/zHf5QkdenS/v+T1tDQoIiIiHZ/HgAdi1eIAHRKM2fO1Jw5c1RVVSWHw6Gbb765xZqzZ89q+vTpuvHGG9W9e3dNnDhRhw4dClrzzjvvaNCgQXI6nbr55pu1fPnyoOM333yzlixZounTp8vlcmn27NlqaGhQVlaW4uPj1a1bNyUlJSk/P789LxdAOyOIAHRKL774ohYvXqzevXvrxIkT+vTTT1usmTlzpj777DNt3rxZZWVlCgQCuvfee9XY2ChJKi8v10MPPaSpU6dq3759WrhwoRYsWKCCgoKg8zz33HMaNmyY/vSnP2nBggV66aWXtHnzZm3YsEGVlZVau3btFYMMQOfBW2YAOiW3262oqCiFh4fL4/G0OH7o0CFt3rxZu3btst5SW7t2rRITE7Vp0yY9+OCDWrFihcaNG6cFCxZIkm6//XZ9/vnnWrZsmWbOnGmda+zYsXr66aet7aqqKt122226++675XA4lJSU1L4XC6Dd8QoRgOvSwYMH1aVLF40cOdLad9NNN6l///46ePCgtWbUqFFBPzdq1CgdOnRITU1N1r7hw4cHrZk5c6YqKirUv39//fznP9e2bdva8UoAdASCCAC+xQ033BC0feedd+ro0aNasmSJLly4oIceekg//vGPbZoOQFsgiABclwYOHKhLly5pz5491r7Tp0+rsrJSycnJ1ppdu3YF/dyuXbt0++23Kzw8/Krnd7lcevjhh/Xb3/5W69ev1zvvvKMzZ860/YUA6BDcQwTgunTbbbfpgQce0KxZs/Tqq68qKipKv/zlL/WDH/xADzzwgCTp6aef1ogRI7RkyRI9/PDDKisr029+8xu98sorVz33ihUrFB8fr3/4h39QWFiY3n77bXk8HkVHR3fAlQFoD7xCBOC69frrryslJUX33XefvF6vAoGA3n//fXXt2lXS39/62rBhg9566y0NHjxYeXl5Wrx4cdAN1VcSFRWlpUuXavjw4RoxYoT+8pe/6P3331dYGP+TCnRWjkAgELB7CAAAADvxf2cAAIDxCCIAAGA8gggAABiPIAIAAMYjiAAAgPEIIgAAYDyCCAAAGI8gAgAAxiOIAACA8QgiAABgPIIIAAAY7/8AX8u1/ILIqEMAAAAASUVORK5CYII=", 714 | "text/plain": [ 715 | "
" 716 | ] 717 | }, 718 | "metadata": {}, 719 | "output_type": "display_data" 720 | } 721 | ], 722 | "source": [ 723 | "sns.countplot(data=data,x=data['floors'])" 724 | ] 725 | }, 726 | { 727 | "cell_type": "code", 728 | "execution_count": 15, 729 | "id": "9b40aea2", 730 | "metadata": { 731 | "execution": { 732 | "iopub.execute_input": "2022-11-05T08:25:30.891036Z", 733 | "iopub.status.busy": "2022-11-05T08:25:30.889937Z", 734 | "iopub.status.idle": "2022-11-05T08:25:31.110151Z", 735 | "shell.execute_reply": "2022-11-05T08:25:31.109298Z" 736 | }, 737 | "papermill": { 738 | "duration": 0.236117, 739 | "end_time": "2022-11-05T08:25:31.112606", 740 | "exception": false, 741 | "start_time": "2022-11-05T08:25:30.876489", 742 | "status": "completed" 743 | }, 744 | "tags": [] 745 | }, 746 | "outputs": [ 747 | { 748 | "data": { 749 | "text/plain": [ 750 | "" 751 | ] 752 | }, 753 | "execution_count": 15, 754 | "metadata": {}, 755 | "output_type": "execute_result" 756 | }, 757 | { 758 | "data": { 759 | "image/png": "", 760 | "text/plain": [ 761 | "
" 762 | ] 763 | }, 764 | "metadata": {}, 765 | "output_type": "display_data" 766 | } 767 | ], 768 | "source": [ 769 | "sns.countplot(data=data,x=data['bathrooms'])" 770 | ] 771 | }, 772 | { 773 | "cell_type": "code", 774 | "execution_count": 16, 775 | "id": "ecc0c0fa", 776 | "metadata": { 777 | "execution": { 778 | "iopub.execute_input": "2022-11-05T08:25:31.140448Z", 779 | "iopub.status.busy": "2022-11-05T08:25:31.139323Z", 780 | "iopub.status.idle": "2022-11-05T08:25:31.391756Z", 781 | "shell.execute_reply": "2022-11-05T08:25:31.390457Z" 782 | }, 783 | "papermill": { 784 | "duration": 0.26891, 785 | "end_time": "2022-11-05T08:25:31.394121", 786 | "exception": false, 787 | "start_time": "2022-11-05T08:25:31.125211", 788 | "status": "completed" 789 | }, 790 | "tags": [] 791 | }, 792 | "outputs": [ 793 | { 794 | "data": { 795 | "text/plain": [ 796 | "" 797 | ] 798 | }, 799 | "execution_count": 16, 800 | "metadata": {}, 801 | "output_type": "execute_result" 802 | }, 803 | { 804 | "data": { 805 | "image/png": "", 806 | "text/plain": [ 807 | "
" 808 | ] 809 | }, 810 | "metadata": {}, 811 | "output_type": "display_data" 812 | } 813 | ], 814 | "source": [ 815 | "sns.countplot(data=data,x=data['bedrooms'])" 816 | ] 817 | }, 818 | { 819 | "cell_type": "code", 820 | "execution_count": 17, 821 | "id": "d491175d", 822 | "metadata": { 823 | "execution": { 824 | "iopub.execute_input": "2022-11-05T08:25:31.421492Z", 825 | "iopub.status.busy": "2022-11-05T08:25:31.421059Z", 826 | "iopub.status.idle": "2022-11-05T08:25:31.604739Z", 827 | "shell.execute_reply": "2022-11-05T08:25:31.603899Z" 828 | }, 829 | "papermill": { 830 | "duration": 0.200317, 831 | "end_time": "2022-11-05T08:25:31.607467", 832 | "exception": false, 833 | "start_time": "2022-11-05T08:25:31.407150", 834 | "status": "completed" 835 | }, 836 | "tags": [] 837 | }, 838 | "outputs": [ 839 | { 840 | "data": { 841 | "text/plain": [ 842 | "" 843 | ] 844 | }, 845 | "execution_count": 17, 846 | "metadata": {}, 847 | "output_type": "execute_result" 848 | }, 849 | { 850 | "data": { 851 | "image/png": "", 852 | "text/plain": [ 853 | "
" 854 | ] 855 | }, 856 | "metadata": {}, 857 | "output_type": "display_data" 858 | } 859 | ], 860 | "source": [ 861 | "sns.countplot(data=data,x=data['waterfront'])" 862 | ] 863 | }, 864 | { 865 | "cell_type": "markdown", 866 | "id": "160e09e0", 867 | "metadata": { 868 | "papermill": { 869 | "duration": 0.013553, 870 | "end_time": "2022-11-05T08:25:31.660822", 871 | "exception": false, 872 | "start_time": "2022-11-05T08:25:31.647269", 873 | "status": "completed" 874 | }, 875 | "tags": [] 876 | }, 877 | "source": [ 878 | "## Model Creation" 879 | ] 880 | }, 881 | { 882 | "cell_type": "code", 883 | "execution_count": 18, 884 | "id": "a00ed84d", 885 | "metadata": { 886 | "execution": { 887 | "iopub.execute_input": "2022-11-05T08:25:31.689713Z", 888 | "iopub.status.busy": "2022-11-05T08:25:31.689309Z", 889 | "iopub.status.idle": "2022-11-05T08:25:31.699095Z", 890 | "shell.execute_reply": "2022-11-05T08:25:31.698235Z" 891 | }, 892 | "papermill": { 893 | "duration": 0.027012, 894 | "end_time": "2022-11-05T08:25:31.701749", 895 | "exception": false, 896 | "start_time": "2022-11-05T08:25:31.674737", 897 | "status": "completed" 898 | }, 899 | "tags": [] 900 | }, 901 | "outputs": [ 902 | { 903 | "data": { 904 | "text/plain": [ 905 | "sqft_basement\n", 906 | "0 2745\n", 907 | "500 53\n", 908 | "600 45\n", 909 | "800 43\n", 910 | "900 41\n", 911 | " ... \n", 912 | "2300 1\n", 913 | "265 1\n", 914 | "1610 1\n", 915 | "862 1\n", 916 | "1640 1\n", 917 | "Name: count, Length: 207, dtype: int64" 918 | ] 919 | }, 920 | "execution_count": 18, 921 | "metadata": {}, 922 | "output_type": "execute_result" 923 | } 924 | ], 925 | "source": [ 926 | "data['sqft_basement'].value_counts()" 927 | ] 928 | }, 929 | { 930 | "cell_type": "code", 931 | "execution_count": 19, 932 | "id": "cf79255f", 933 | "metadata": { 934 | "execution": { 935 | "iopub.execute_input": "2022-11-05T08:25:31.731019Z", 936 | "iopub.status.busy": "2022-11-05T08:25:31.730556Z", 937 | "iopub.status.idle": "2022-11-05T08:25:31.738304Z", 938 | "shell.execute_reply": "2022-11-05T08:25:31.736852Z" 939 | }, 940 | "papermill": { 941 | "duration": 0.025349, 942 | "end_time": "2022-11-05T08:25:31.740891", 943 | "exception": false, 944 | "start_time": "2022-11-05T08:25:31.715542", 945 | "status": "completed" 946 | }, 947 | "tags": [] 948 | }, 949 | "outputs": [], 950 | "source": [ 951 | "data = data.drop([\"city\",\"view\",\"waterfront\",\"sqft_basement\"],axis=1)" 952 | ] 953 | }, 954 | { 955 | "cell_type": "code", 956 | "execution_count": 20, 957 | "id": "40dce89c", 958 | "metadata": { 959 | "execution": { 960 | "iopub.execute_input": "2022-11-05T08:25:31.822281Z", 961 | "iopub.status.busy": "2022-11-05T08:25:31.821767Z", 962 | "iopub.status.idle": "2022-11-05T08:25:31.829605Z", 963 | "shell.execute_reply": "2022-11-05T08:25:31.828190Z" 964 | }, 965 | "papermill": { 966 | "duration": 0.025326, 967 | "end_time": "2022-11-05T08:25:31.832232", 968 | "exception": false, 969 | "start_time": "2022-11-05T08:25:31.806906", 970 | "status": "completed" 971 | }, 972 | "tags": [] 973 | }, 974 | "outputs": [], 975 | "source": [ 976 | "x = np.array(data.loc[:,data.columns != \"price\"].values)\n", 977 | "y = np.array(data[\"price\"].values)" 978 | ] 979 | }, 980 | { 981 | "cell_type": "code", 982 | "execution_count": 21, 983 | "id": "2cada5be", 984 | "metadata": { 985 | "execution": { 986 | "iopub.execute_input": "2022-11-05T08:25:31.860997Z", 987 | "iopub.status.busy": "2022-11-05T08:25:31.860507Z", 988 | "iopub.status.idle": "2022-11-05T08:25:31.868697Z", 989 | "shell.execute_reply": "2022-11-05T08:25:31.867705Z" 990 | }, 991 | "papermill": { 992 | "duration": 0.02536, 993 | "end_time": "2022-11-05T08:25:31.871073", 994 | "exception": false, 995 | "start_time": "2022-11-05T08:25:31.845713", 996 | "status": "completed" 997 | }, 998 | "tags": [] 999 | }, 1000 | "outputs": [ 1001 | { 1002 | "data": { 1003 | "text/plain": [ 1004 | "array([[ 3, 1, 1340, ..., 3, 1340, 36],\n", 1005 | " [ 5, 2, 3650, ..., 5, 3370, 35],\n", 1006 | " [ 3, 2, 1930, ..., 4, 1930, 18],\n", 1007 | " ...,\n", 1008 | " [ 3, 2, 3010, ..., 3, 3010, 32],\n", 1009 | " [ 4, 2, 2090, ..., 3, 1070, 35],\n", 1010 | " [ 3, 2, 1490, ..., 4, 1490, 9]], dtype=int64)" 1011 | ] 1012 | }, 1013 | "execution_count": 21, 1014 | "metadata": {}, 1015 | "output_type": "execute_result" 1016 | } 1017 | ], 1018 | "source": [ 1019 | "x" 1020 | ] 1021 | }, 1022 | { 1023 | "cell_type": "code", 1024 | "execution_count": 22, 1025 | "id": "2dba4b6c", 1026 | "metadata": { 1027 | "execution": { 1028 | "iopub.execute_input": "2022-11-05T08:25:31.899555Z", 1029 | "iopub.status.busy": "2022-11-05T08:25:31.899146Z", 1030 | "iopub.status.idle": "2022-11-05T08:25:31.905957Z", 1031 | "shell.execute_reply": "2022-11-05T08:25:31.904792Z" 1032 | }, 1033 | "papermill": { 1034 | "duration": 0.024129, 1035 | "end_time": "2022-11-05T08:25:31.908496", 1036 | "exception": false, 1037 | "start_time": "2022-11-05T08:25:31.884367", 1038 | "status": "completed" 1039 | }, 1040 | "tags": [] 1041 | }, 1042 | "outputs": [ 1043 | { 1044 | "data": { 1045 | "text/plain": [ 1046 | "array([ 313000, 2384000, 342000, ..., 416904, 203400, 220600])" 1047 | ] 1048 | }, 1049 | "execution_count": 22, 1050 | "metadata": {}, 1051 | "output_type": "execute_result" 1052 | } 1053 | ], 1054 | "source": [ 1055 | "y" 1056 | ] 1057 | }, 1058 | { 1059 | "cell_type": "code", 1060 | "execution_count": 23, 1061 | "id": "03618f50", 1062 | "metadata": { 1063 | "execution": { 1064 | "iopub.execute_input": "2022-11-05T08:25:31.937320Z", 1065 | "iopub.status.busy": "2022-11-05T08:25:31.936881Z", 1066 | "iopub.status.idle": "2022-11-05T08:25:31.944616Z", 1067 | "shell.execute_reply": "2022-11-05T08:25:31.943245Z" 1068 | }, 1069 | "papermill": { 1070 | "duration": 0.024941, 1071 | "end_time": "2022-11-05T08:25:31.947081", 1072 | "exception": false, 1073 | "start_time": "2022-11-05T08:25:31.922140", 1074 | "status": "completed" 1075 | }, 1076 | "tags": [] 1077 | }, 1078 | "outputs": [], 1079 | "source": [ 1080 | "x_train,x_test,y_train,y_test = train_test_split(x,y,test_size=0.1,random_state=42)" 1081 | ] 1082 | }, 1083 | { 1084 | "cell_type": "code", 1085 | "execution_count": 24, 1086 | "id": "17dbd7a0", 1087 | "metadata": { 1088 | "execution": { 1089 | "iopub.execute_input": "2022-11-05T08:25:31.975637Z", 1090 | "iopub.status.busy": "2022-11-05T08:25:31.975207Z", 1091 | "iopub.status.idle": "2022-11-05T08:25:31.982824Z", 1092 | "shell.execute_reply": "2022-11-05T08:25:31.981979Z" 1093 | }, 1094 | "papermill": { 1095 | "duration": 0.024459, 1096 | "end_time": "2022-11-05T08:25:31.984999", 1097 | "exception": false, 1098 | "start_time": "2022-11-05T08:25:31.960540", 1099 | "status": "completed" 1100 | }, 1101 | "tags": [] 1102 | }, 1103 | "outputs": [ 1104 | { 1105 | "data": { 1106 | "text/plain": [ 1107 | "array([[ 3, 1, 1340, ..., 3, 1340, 36],\n", 1108 | " [ 5, 2, 3650, ..., 5, 3370, 35],\n", 1109 | " [ 3, 2, 1930, ..., 4, 1930, 18],\n", 1110 | " ...,\n", 1111 | " [ 3, 2, 3010, ..., 3, 3010, 32],\n", 1112 | " [ 4, 2, 2090, ..., 3, 1070, 35],\n", 1113 | " [ 3, 2, 1490, ..., 4, 1490, 9]], dtype=int64)" 1114 | ] 1115 | }, 1116 | "execution_count": 24, 1117 | "metadata": {}, 1118 | "output_type": "execute_result" 1119 | } 1120 | ], 1121 | "source": [ 1122 | "x" 1123 | ] 1124 | }, 1125 | { 1126 | "cell_type": "code", 1127 | "execution_count": 25, 1128 | "id": "4b754402", 1129 | "metadata": { 1130 | "execution": { 1131 | "iopub.execute_input": "2022-11-05T08:25:32.040456Z", 1132 | "iopub.status.busy": "2022-11-05T08:25:32.040032Z", 1133 | "iopub.status.idle": "2022-11-05T08:25:32.067598Z", 1134 | "shell.execute_reply": "2022-11-05T08:25:32.066056Z" 1135 | }, 1136 | "papermill": { 1137 | "duration": 0.044743, 1138 | "end_time": "2022-11-05T08:25:32.070063", 1139 | "exception": false, 1140 | "start_time": "2022-11-05T08:25:32.025320", 1141 | "status": "completed" 1142 | }, 1143 | "tags": [] 1144 | }, 1145 | "outputs": [ 1146 | { 1147 | "data": { 1148 | "text/html": [ 1149 | "
LinearRegression()
In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
On GitHub, the HTML representation is unable to render, please try loading this page with nbviewer.org.
" 1150 | ], 1151 | "text/plain": [ 1152 | "LinearRegression()" 1153 | ] 1154 | }, 1155 | "execution_count": 25, 1156 | "metadata": {}, 1157 | "output_type": "execute_result" 1158 | } 1159 | ], 1160 | "source": [ 1161 | "model_lr = LinearRegression()\n", 1162 | "model_lr.fit(x_train,y_train)" 1163 | ] 1164 | }, 1165 | { 1166 | "cell_type": "code", 1167 | "execution_count": 26, 1168 | "id": "4154b24a", 1169 | "metadata": { 1170 | "execution": { 1171 | "iopub.execute_input": "2022-11-05T08:25:32.099871Z", 1172 | "iopub.status.busy": "2022-11-05T08:25:32.099154Z", 1173 | "iopub.status.idle": "2022-11-05T08:25:32.108611Z", 1174 | "shell.execute_reply": "2022-11-05T08:25:32.107058Z" 1175 | }, 1176 | "papermill": { 1177 | "duration": 0.027656, 1178 | "end_time": "2022-11-05T08:25:32.111250", 1179 | "exception": false, 1180 | "start_time": "2022-11-05T08:25:32.083594", 1181 | "status": "completed" 1182 | }, 1183 | "tags": [] 1184 | }, 1185 | "outputs": [], 1186 | "source": [ 1187 | "predictions_lr = model_lr.predict(x_test)" 1188 | ] 1189 | }, 1190 | { 1191 | "cell_type": "code", 1192 | "execution_count": 27, 1193 | "id": "e7210f04", 1194 | "metadata": { 1195 | "execution": { 1196 | "iopub.execute_input": "2022-11-05T08:25:32.143266Z", 1197 | "iopub.status.busy": "2022-11-05T08:25:32.141898Z", 1198 | "iopub.status.idle": "2022-11-05T08:25:32.154013Z", 1199 | "shell.execute_reply": "2022-11-05T08:25:32.152405Z" 1200 | }, 1201 | "papermill": { 1202 | "duration": 0.03151, 1203 | "end_time": "2022-11-05T08:25:32.156761", 1204 | "exception": false, 1205 | "start_time": "2022-11-05T08:25:32.125251", 1206 | "status": "completed" 1207 | }, 1208 | "tags": [] 1209 | }, 1210 | "outputs": [ 1211 | { 1212 | "data": { 1213 | "text/plain": [ 1214 | "0.3183144703701215" 1215 | ] 1216 | }, 1217 | "execution_count": 27, 1218 | "metadata": {}, 1219 | "output_type": "execute_result" 1220 | } 1221 | ], 1222 | "source": [ 1223 | "mean_absolute_percentage_error(predictions_lr,y_test)" 1224 | ] 1225 | }, 1226 | { 1227 | "cell_type": "code", 1228 | "execution_count": 28, 1229 | "id": "ac1f2b3e", 1230 | "metadata": { 1231 | "execution": { 1232 | "iopub.execute_input": "2022-11-05T08:25:32.216071Z", 1233 | "iopub.status.busy": "2022-11-05T08:25:32.215312Z", 1234 | "iopub.status.idle": "2022-11-05T08:25:32.369227Z", 1235 | "shell.execute_reply": "2022-11-05T08:25:32.367811Z" 1236 | }, 1237 | "papermill": { 1238 | "duration": 0.172599, 1239 | "end_time": "2022-11-05T08:25:32.372327", 1240 | "exception": false, 1241 | "start_time": "2022-11-05T08:25:32.199728", 1242 | "status": "completed" 1243 | }, 1244 | "tags": [] 1245 | }, 1246 | "outputs": [], 1247 | "source": [ 1248 | "model = RandomForestRegressor(n_estimators=10)\n", 1249 | "model.fit(x_train,y_train)\n", 1250 | "predictions = model.predict(x_test)" 1251 | ] 1252 | }, 1253 | { 1254 | "cell_type": "code", 1255 | "execution_count": 29, 1256 | "id": "4bbf64d2", 1257 | "metadata": { 1258 | "execution": { 1259 | "iopub.execute_input": "2022-11-05T08:25:32.401682Z", 1260 | "iopub.status.busy": "2022-11-05T08:25:32.401256Z", 1261 | "iopub.status.idle": "2022-11-05T08:25:32.409150Z", 1262 | "shell.execute_reply": "2022-11-05T08:25:32.408030Z" 1263 | }, 1264 | "papermill": { 1265 | "duration": 0.025347, 1266 | "end_time": "2022-11-05T08:25:32.411577", 1267 | "exception": false, 1268 | "start_time": "2022-11-05T08:25:32.386230", 1269 | "status": "completed" 1270 | }, 1271 | "tags": [] 1272 | }, 1273 | "outputs": [ 1274 | { 1275 | "data": { 1276 | "text/plain": [ 1277 | "0.24210417557737207" 1278 | ] 1279 | }, 1280 | "execution_count": 29, 1281 | "metadata": {}, 1282 | "output_type": "execute_result" 1283 | } 1284 | ], 1285 | "source": [ 1286 | "mean_absolute_percentage_error(predictions,y_test)" 1287 | ] 1288 | }, 1289 | { 1290 | "cell_type": "code", 1291 | "execution_count": 32, 1292 | "id": "0a16e9cb", 1293 | "metadata": {}, 1294 | "outputs": [ 1295 | { 1296 | "data": { 1297 | "text/html": [ 1298 | "
\n", 1299 | "\n", 1312 | "\n", 1313 | " \n", 1314 | " \n", 1315 | " \n", 1316 | " \n", 1317 | " \n", 1318 | " \n", 1319 | " \n", 1320 | " \n", 1321 | " \n", 1322 | " \n", 1323 | " \n", 1324 | " \n", 1325 | " \n", 1326 | " \n", 1327 | " \n", 1328 | " \n", 1329 | " \n", 1330 | " \n", 1331 | " \n", 1332 | " \n", 1333 | " \n", 1334 | " \n", 1335 | " \n", 1336 | " \n", 1337 | " \n", 1338 | " \n", 1339 | " \n", 1340 | " \n", 1341 | " \n", 1342 | " \n", 1343 | " \n", 1344 | " \n", 1345 | " \n", 1346 | " \n", 1347 | " \n", 1348 | " \n", 1349 | " \n", 1350 | " \n", 1351 | " \n", 1352 | " \n", 1353 | " \n", 1354 | " \n", 1355 | " \n", 1356 | " \n", 1357 | " \n", 1358 | " \n", 1359 | " \n", 1360 | " \n", 1361 | " \n", 1362 | " \n", 1363 | " \n", 1364 | " \n", 1365 | " \n", 1366 | " \n", 1367 | " \n", 1368 | " \n", 1369 | " \n", 1370 | " \n", 1371 | " \n", 1372 | " \n", 1373 | " \n", 1374 | " \n", 1375 | " \n", 1376 | " \n", 1377 | " \n", 1378 | " \n", 1379 | " \n", 1380 | " \n", 1381 | " \n", 1382 | " \n", 1383 | " \n", 1384 | " \n", 1385 | " \n", 1386 | " \n", 1387 | " \n", 1388 | " \n", 1389 | "
pricebedroomsbathroomssqft_livingsqft_lotfloorsconditionsqft_abovecity_new
0313000311340791213134036
12384000523650905025337035
23420003219301194714193018
342000032200080301410003
45500004219401050014114031
\n", 1390 | "
" 1391 | ], 1392 | "text/plain": [ 1393 | " price bedrooms bathrooms sqft_living sqft_lot floors condition \\\n", 1394 | "0 313000 3 1 1340 7912 1 3 \n", 1395 | "1 2384000 5 2 3650 9050 2 5 \n", 1396 | "2 342000 3 2 1930 11947 1 4 \n", 1397 | "3 420000 3 2 2000 8030 1 4 \n", 1398 | "4 550000 4 2 1940 10500 1 4 \n", 1399 | "\n", 1400 | " sqft_above city_new \n", 1401 | "0 1340 36 \n", 1402 | "1 3370 35 \n", 1403 | "2 1930 18 \n", 1404 | "3 1000 3 \n", 1405 | "4 1140 31 " 1406 | ] 1407 | }, 1408 | "execution_count": 32, 1409 | "metadata": {}, 1410 | "output_type": "execute_result" 1411 | } 1412 | ], 1413 | "source": [ 1414 | "data.head()" 1415 | ] 1416 | }, 1417 | { 1418 | "cell_type": "code", 1419 | "execution_count": 33, 1420 | "id": "32b3dfde", 1421 | "metadata": { 1422 | "execution": { 1423 | "iopub.execute_input": "2022-11-05T08:25:32.495627Z", 1424 | "iopub.status.busy": "2022-11-05T08:25:32.495195Z", 1425 | "iopub.status.idle": "2022-11-05T08:25:32.504061Z", 1426 | "shell.execute_reply": "2022-11-05T08:25:32.503047Z" 1427 | }, 1428 | "papermill": { 1429 | "duration": 0.026607, 1430 | "end_time": "2022-11-05T08:25:32.506128", 1431 | "exception": false, 1432 | "start_time": "2022-11-05T08:25:32.479521", 1433 | "status": "completed" 1434 | }, 1435 | "tags": [] 1436 | }, 1437 | "outputs": [ 1438 | { 1439 | "data": { 1440 | "text/plain": [ 1441 | "array([284900.])" 1442 | ] 1443 | }, 1444 | "execution_count": 33, 1445 | "metadata": {}, 1446 | "output_type": "execute_result" 1447 | } 1448 | ], 1449 | "source": [ 1450 | "a = [1,1,200,200,1,2,200,36]\n", 1451 | "model.predict([a])" 1452 | ] 1453 | }, 1454 | { 1455 | "cell_type": "code", 1456 | "execution_count": 35, 1457 | "id": "76fa023e", 1458 | "metadata": {}, 1459 | "outputs": [ 1460 | { 1461 | "data": { 1462 | "text/plain": [ 1463 | "array([314950.])" 1464 | ] 1465 | }, 1466 | "execution_count": 35, 1467 | "metadata": {}, 1468 | "output_type": "execute_result" 1469 | } 1470 | ], 1471 | "source": [ 1472 | "b =[3,1,1340,7912,1,3,1340,36]\n", 1473 | "model.predict([b])" 1474 | ] 1475 | }, 1476 | { 1477 | "cell_type": "code", 1478 | "execution_count": null, 1479 | "id": "7b7c018b", 1480 | "metadata": {}, 1481 | "outputs": [], 1482 | "source": [] 1483 | } 1484 | ], 1485 | "metadata": { 1486 | "kernelspec": { 1487 | "display_name": "Python 3", 1488 | "language": "python", 1489 | "name": "python3" 1490 | }, 1491 | "language_info": { 1492 | "codemirror_mode": { 1493 | "name": "ipython", 1494 | "version": 3 1495 | }, 1496 | "file_extension": ".py", 1497 | "mimetype": "text/x-python", 1498 | "name": "python", 1499 | "nbconvert_exporter": "python", 1500 | "pygments_lexer": "ipython3", 1501 | "version": "3.10.0" 1502 | }, 1503 | "papermill": { 1504 | "default_parameters": {}, 1505 | "duration": 16.918623, 1506 | "end_time": "2022-11-05T08:25:33.493433", 1507 | "environment_variables": {}, 1508 | "exception": null, 1509 | "input_path": "__notebook__.ipynb", 1510 | "output_path": "__notebook__.ipynb", 1511 | "parameters": {}, 1512 | "start_time": "2022-11-05T08:25:16.574810", 1513 | "version": "2.3.4" 1514 | } 1515 | }, 1516 | "nbformat": 4, 1517 | "nbformat_minor": 5 1518 | } 1519 | -------------------------------------------------------------------------------- /pima-indians-diabetes-database-svm-accuracy-79.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "cells": [ 3 | { 4 | "cell_type": "code", 5 | "execution_count": 1, 6 | "id": "149d2d1e", 7 | "metadata": { 8 | "execution": { 9 | "iopub.execute_input": "2023-05-17T05:30:26.966373Z", 10 | "iopub.status.busy": "2023-05-17T05:30:26.965827Z", 11 | "iopub.status.idle": "2023-05-17T05:30:28.438333Z", 12 | "shell.execute_reply": "2023-05-17T05:30:28.437064Z" 13 | }, 14 | "papermill": { 15 | "duration": 1.480344, 16 | "end_time": "2023-05-17T05:30:28.440911", 17 | "exception": false, 18 | "start_time": "2023-05-17T05:30:26.960567", 19 | "status": "completed" 20 | }, 21 | "tags": [] 22 | }, 23 | "outputs": [], 24 | "source": [ 25 | "import pandas as pd\n", 26 | "import numpy as np\n", 27 | "import matplotlib.pyplot as plt\n", 28 | "import sklearn \n", 29 | "from sklearn import svm\n", 30 | "from sklearn import metrics" 31 | ] 32 | }, 33 | { 34 | "cell_type": "code", 35 | "execution_count": 2, 36 | "id": "49a07ff9", 37 | "metadata": { 38 | "execution": { 39 | "iopub.execute_input": "2023-05-17T05:30:28.452774Z", 40 | "iopub.status.busy": "2023-05-17T05:30:28.452446Z", 41 | "iopub.status.idle": "2023-05-17T05:30:28.478510Z", 42 | "shell.execute_reply": "2023-05-17T05:30:28.477000Z" 43 | }, 44 | "papermill": { 45 | "duration": 0.03423, 46 | "end_time": "2023-05-17T05:30:28.481010", 47 | "exception": false, 48 | "start_time": "2023-05-17T05:30:28.446780", 49 | "status": "completed" 50 | }, 51 | "tags": [] 52 | }, 53 | "outputs": [], 54 | "source": [ 55 | "data = pd.read_csv(\"C:/Users/harin/Downloads/diabetes.csv\")" 56 | ] 57 | }, 58 | { 59 | "cell_type": "code", 60 | "execution_count": 3, 61 | "id": "e9fabbaf", 62 | "metadata": { 63 | "execution": { 64 | "iopub.execute_input": "2023-05-17T05:30:28.490963Z", 65 | "iopub.status.busy": "2023-05-17T05:30:28.490629Z", 66 | "iopub.status.idle": "2023-05-17T05:30:28.524254Z", 67 | "shell.execute_reply": "2023-05-17T05:30:28.523300Z" 68 | }, 69 | "papermill": { 70 | "duration": 0.041305, 71 | "end_time": "2023-05-17T05:30:28.526516", 72 | "exception": false, 73 | "start_time": "2023-05-17T05:30:28.485211", 74 | "status": "completed" 75 | }, 76 | "tags": [] 77 | }, 78 | "outputs": [ 79 | { 80 | "data": { 81 | "text/html": [ 82 | "
\n", 83 | "\n", 96 | "\n", 97 | " \n", 98 | " \n", 99 | " \n", 100 | " \n", 101 | " \n", 102 | " \n", 103 | " \n", 104 | " \n", 105 | " \n", 106 | " \n", 107 | " \n", 108 | " \n", 109 | " \n", 110 | " \n", 111 | " \n", 112 | " \n", 113 | " \n", 114 | " \n", 115 | " \n", 116 | " \n", 117 | " \n", 118 | " \n", 119 | " \n", 120 | " \n", 121 | " \n", 122 | " \n", 123 | " \n", 124 | " \n", 125 | " \n", 126 | " \n", 127 | " \n", 128 | " \n", 129 | " \n", 130 | " \n", 131 | " \n", 132 | " \n", 133 | " \n", 134 | " \n", 135 | " \n", 136 | " \n", 137 | " \n", 138 | " \n", 139 | " \n", 140 | " \n", 141 | " \n", 142 | " \n", 143 | " \n", 144 | " \n", 145 | " \n", 146 | " \n", 147 | " \n", 148 | " \n", 149 | " \n", 150 | " \n", 151 | " \n", 152 | " \n", 153 | " \n", 154 | " \n", 155 | " \n", 156 | " \n", 157 | " \n", 158 | " \n", 159 | " \n", 160 | " \n", 161 | " \n", 162 | " \n", 163 | " \n", 164 | " \n", 165 | " \n", 166 | " \n", 167 | " \n", 168 | " \n", 169 | " \n", 170 | " \n", 171 | " \n", 172 | " \n", 173 | " \n", 174 | " \n", 175 | " \n", 176 | " \n", 177 | " \n", 178 | " \n", 179 | " \n", 180 | " \n", 181 | " \n", 182 | " \n", 183 | " \n", 184 | " \n", 185 | " \n", 186 | " \n", 187 | " \n", 188 | " \n", 189 | " \n", 190 | " \n", 191 | " \n", 192 | " \n", 193 | " \n", 194 | " \n", 195 | " \n", 196 | " \n", 197 | " \n", 198 | " \n", 199 | " \n", 200 | " \n", 201 | " \n", 202 | " \n", 203 | " \n", 204 | " \n", 205 | " \n", 206 | " \n", 207 | " \n", 208 | " \n", 209 | " \n", 210 | " \n", 211 | " \n", 212 | " \n", 213 | " \n", 214 | " \n", 215 | " \n", 216 | " \n", 217 | " \n", 218 | " \n", 219 | " \n", 220 | " \n", 221 | " \n", 222 | " \n", 223 | " \n", 224 | " \n", 225 | " \n", 226 | " \n", 227 | " \n", 228 | " \n", 229 | " \n", 230 | " \n", 231 | " \n", 232 | " \n", 233 | "
PregnanciesGlucoseBloodPressureSkinThicknessInsulinBMIDiabetesPedigreeFunctionAgeOutcome
061487235033.60.627501
11856629026.60.351310
28183640023.30.672321
318966239428.10.167210
40137403516843.12.288331
55116740025.60.201300
637850328831.00.248261
71011500035.30.134290
82197704554330.50.158531
9812596000.00.232541
\n", 234 | "
" 235 | ], 236 | "text/plain": [ 237 | " Pregnancies Glucose BloodPressure SkinThickness Insulin BMI \\\n", 238 | "0 6 148 72 35 0 33.6 \n", 239 | "1 1 85 66 29 0 26.6 \n", 240 | "2 8 183 64 0 0 23.3 \n", 241 | "3 1 89 66 23 94 28.1 \n", 242 | "4 0 137 40 35 168 43.1 \n", 243 | "5 5 116 74 0 0 25.6 \n", 244 | "6 3 78 50 32 88 31.0 \n", 245 | "7 10 115 0 0 0 35.3 \n", 246 | "8 2 197 70 45 543 30.5 \n", 247 | "9 8 125 96 0 0 0.0 \n", 248 | "\n", 249 | " DiabetesPedigreeFunction Age Outcome \n", 250 | "0 0.627 50 1 \n", 251 | "1 0.351 31 0 \n", 252 | "2 0.672 32 1 \n", 253 | "3 0.167 21 0 \n", 254 | "4 2.288 33 1 \n", 255 | "5 0.201 30 0 \n", 256 | "6 0.248 26 1 \n", 257 | "7 0.134 29 0 \n", 258 | "8 0.158 53 1 \n", 259 | "9 0.232 54 1 " 260 | ] 261 | }, 262 | "execution_count": 3, 263 | "metadata": {}, 264 | "output_type": "execute_result" 265 | } 266 | ], 267 | "source": [ 268 | "data.head(10)" 269 | ] 270 | }, 271 | { 272 | "cell_type": "code", 273 | "execution_count": 5, 274 | "id": "abd6d66a", 275 | "metadata": { 276 | "execution": { 277 | "iopub.execute_input": "2023-05-17T05:30:28.609497Z", 278 | "iopub.status.busy": "2023-05-17T05:30:28.609183Z", 279 | "iopub.status.idle": "2023-05-17T05:30:28.616414Z", 280 | "shell.execute_reply": "2023-05-17T05:30:28.615121Z" 281 | }, 282 | "papermill": { 283 | "duration": 0.015147, 284 | "end_time": "2023-05-17T05:30:28.618308", 285 | "exception": false, 286 | "start_time": "2023-05-17T05:30:28.603161", 287 | "status": "completed" 288 | }, 289 | "tags": [] 290 | }, 291 | "outputs": [ 292 | { 293 | "data": { 294 | "text/plain": [ 295 | "(768, 9)" 296 | ] 297 | }, 298 | "execution_count": 5, 299 | "metadata": {}, 300 | "output_type": "execute_result" 301 | } 302 | ], 303 | "source": [ 304 | "data.shape" 305 | ] 306 | }, 307 | { 308 | "cell_type": "code", 309 | "execution_count": 6, 310 | "id": "bf342298", 311 | "metadata": { 312 | "execution": { 313 | "iopub.execute_input": "2023-05-17T05:30:28.629370Z", 314 | "iopub.status.busy": "2023-05-17T05:30:28.629046Z", 315 | "iopub.status.idle": "2023-05-17T05:30:28.663119Z", 316 | "shell.execute_reply": "2023-05-17T05:30:28.662087Z" 317 | }, 318 | "papermill": { 319 | "duration": 0.041756, 320 | "end_time": "2023-05-17T05:30:28.664927", 321 | "exception": false, 322 | "start_time": "2023-05-17T05:30:28.623171", 323 | "status": "completed" 324 | }, 325 | "tags": [] 326 | }, 327 | "outputs": [ 328 | { 329 | "data": { 330 | "text/html": [ 331 | "
\n", 332 | "\n", 345 | "\n", 346 | " \n", 347 | " \n", 348 | " \n", 349 | " \n", 350 | " \n", 351 | " \n", 352 | " \n", 353 | " \n", 354 | " \n", 355 | " \n", 356 | " \n", 357 | " \n", 358 | " \n", 359 | " \n", 360 | " \n", 361 | " \n", 362 | " \n", 363 | " \n", 364 | " \n", 365 | " \n", 366 | " \n", 367 | " \n", 368 | " \n", 369 | " \n", 370 | " \n", 371 | " \n", 372 | " \n", 373 | " \n", 374 | " \n", 375 | " \n", 376 | " \n", 377 | " \n", 378 | " \n", 379 | " \n", 380 | " \n", 381 | " \n", 382 | " \n", 383 | " \n", 384 | " \n", 385 | " \n", 386 | " \n", 387 | " \n", 388 | " \n", 389 | " \n", 390 | " \n", 391 | " \n", 392 | " \n", 393 | " \n", 394 | " \n", 395 | " \n", 396 | " \n", 397 | " \n", 398 | " \n", 399 | " \n", 400 | " \n", 401 | " \n", 402 | " \n", 403 | " \n", 404 | " \n", 405 | " \n", 406 | " \n", 407 | " \n", 408 | " \n", 409 | " \n", 410 | " \n", 411 | " \n", 412 | " \n", 413 | " \n", 414 | " \n", 415 | " \n", 416 | " \n", 417 | " \n", 418 | " \n", 419 | " \n", 420 | " \n", 421 | " \n", 422 | " \n", 423 | " \n", 424 | " \n", 425 | " \n", 426 | " \n", 427 | " \n", 428 | " \n", 429 | " \n", 430 | " \n", 431 | " \n", 432 | " \n", 433 | " \n", 434 | " \n", 435 | " \n", 436 | " \n", 437 | " \n", 438 | " \n", 439 | " \n", 440 | " \n", 441 | " \n", 442 | " \n", 443 | " \n", 444 | " \n", 445 | " \n", 446 | " \n", 447 | " \n", 448 | " \n", 449 | " \n", 450 | " \n", 451 | " \n", 452 | " \n", 453 | " \n", 454 | " \n", 455 | " \n", 456 | " \n", 457 | " \n", 458 | "
PregnanciesGlucoseBloodPressureSkinThicknessInsulinBMIDiabetesPedigreeFunctionAgeOutcome
count768.000000768.000000768.000000768.000000768.000000768.000000768.000000768.000000768.000000
mean3.845052120.89453169.10546920.53645879.79947931.9925780.47187633.2408850.348958
std3.36957831.97261819.35580715.952218115.2440027.8841600.33132911.7602320.476951
min0.0000000.0000000.0000000.0000000.0000000.0000000.07800021.0000000.000000
25%1.00000099.00000062.0000000.0000000.00000027.3000000.24375024.0000000.000000
50%3.000000117.00000072.00000023.00000030.50000032.0000000.37250029.0000000.000000
75%6.000000140.25000080.00000032.000000127.25000036.6000000.62625041.0000001.000000
max17.000000199.000000122.00000099.000000846.00000067.1000002.42000081.0000001.000000
\n", 459 | "
" 460 | ], 461 | "text/plain": [ 462 | " Pregnancies Glucose BloodPressure SkinThickness Insulin \\\n", 463 | "count 768.000000 768.000000 768.000000 768.000000 768.000000 \n", 464 | "mean 3.845052 120.894531 69.105469 20.536458 79.799479 \n", 465 | "std 3.369578 31.972618 19.355807 15.952218 115.244002 \n", 466 | "min 0.000000 0.000000 0.000000 0.000000 0.000000 \n", 467 | "25% 1.000000 99.000000 62.000000 0.000000 0.000000 \n", 468 | "50% 3.000000 117.000000 72.000000 23.000000 30.500000 \n", 469 | "75% 6.000000 140.250000 80.000000 32.000000 127.250000 \n", 470 | "max 17.000000 199.000000 122.000000 99.000000 846.000000 \n", 471 | "\n", 472 | " BMI DiabetesPedigreeFunction Age Outcome \n", 473 | "count 768.000000 768.000000 768.000000 768.000000 \n", 474 | "mean 31.992578 0.471876 33.240885 0.348958 \n", 475 | "std 7.884160 0.331329 11.760232 0.476951 \n", 476 | "min 0.000000 0.078000 21.000000 0.000000 \n", 477 | "25% 27.300000 0.243750 24.000000 0.000000 \n", 478 | "50% 32.000000 0.372500 29.000000 0.000000 \n", 479 | "75% 36.600000 0.626250 41.000000 1.000000 \n", 480 | "max 67.100000 2.420000 81.000000 1.000000 " 481 | ] 482 | }, 483 | "execution_count": 6, 484 | "metadata": {}, 485 | "output_type": "execute_result" 486 | } 487 | ], 488 | "source": [ 489 | "data.describe()" 490 | ] 491 | }, 492 | { 493 | "cell_type": "code", 494 | "execution_count": 7, 495 | "id": "ce6226fb", 496 | "metadata": { 497 | "execution": { 498 | "iopub.execute_input": "2023-05-17T05:30:28.677344Z", 499 | "iopub.status.busy": "2023-05-17T05:30:28.675884Z", 500 | "iopub.status.idle": "2023-05-17T05:30:28.688803Z", 501 | "shell.execute_reply": "2023-05-17T05:30:28.686983Z" 502 | }, 503 | "papermill": { 504 | "duration": 0.021206, 505 | "end_time": "2023-05-17T05:30:28.691089", 506 | "exception": false, 507 | "start_time": "2023-05-17T05:30:28.669883", 508 | "status": "completed" 509 | }, 510 | "tags": [] 511 | }, 512 | "outputs": [], 513 | "source": [ 514 | "label = data[[\"Outcome\"]]" 515 | ] 516 | }, 517 | { 518 | "cell_type": "code", 519 | "execution_count": 8, 520 | "id": "d3ee4364", 521 | "metadata": { 522 | "execution": { 523 | "iopub.execute_input": "2023-05-17T05:30:28.702419Z", 524 | "iopub.status.busy": "2023-05-17T05:30:28.702124Z", 525 | "iopub.status.idle": "2023-05-17T05:30:28.707547Z", 526 | "shell.execute_reply": "2023-05-17T05:30:28.706698Z" 527 | }, 528 | "papermill": { 529 | "duration": 0.013589, 530 | "end_time": "2023-05-17T05:30:28.709617", 531 | "exception": false, 532 | "start_time": "2023-05-17T05:30:28.696028", 533 | "status": "completed" 534 | }, 535 | "tags": [] 536 | }, 537 | "outputs": [], 538 | "source": [ 539 | "feature = data.drop(data[['Outcome',\"Age\",\"SkinThickness\",\"Pregnancies\"]],axis=1)" 540 | ] 541 | }, 542 | { 543 | "cell_type": "code", 544 | "execution_count": 9, 545 | "id": "2ce00ebd", 546 | "metadata": { 547 | "execution": { 548 | "iopub.execute_input": "2023-05-17T05:30:28.720429Z", 549 | "iopub.status.busy": "2023-05-17T05:30:28.720118Z", 550 | "iopub.status.idle": "2023-05-17T05:30:28.732930Z", 551 | "shell.execute_reply": "2023-05-17T05:30:28.731499Z" 552 | }, 553 | "papermill": { 554 | "duration": 0.021368, 555 | "end_time": "2023-05-17T05:30:28.735697", 556 | "exception": false, 557 | "start_time": "2023-05-17T05:30:28.714329", 558 | "status": "completed" 559 | }, 560 | "tags": [] 561 | }, 562 | "outputs": [ 563 | { 564 | "data": { 565 | "text/html": [ 566 | "
\n", 567 | "\n", 580 | "\n", 581 | " \n", 582 | " \n", 583 | " \n", 584 | " \n", 585 | " \n", 586 | " \n", 587 | " \n", 588 | " \n", 589 | " \n", 590 | " \n", 591 | " \n", 592 | " \n", 593 | " \n", 594 | " \n", 595 | " \n", 596 | " \n", 597 | " \n", 598 | " \n", 599 | " \n", 600 | " \n", 601 | " \n", 602 | " \n", 603 | " \n", 604 | " \n", 605 | " \n", 606 | " \n", 607 | " \n", 608 | " \n", 609 | " \n", 610 | " \n", 611 | " \n", 612 | " \n", 613 | " \n", 614 | " \n", 615 | " \n", 616 | " \n", 617 | " \n", 618 | " \n", 619 | " \n", 620 | " \n", 621 | " \n", 622 | " \n", 623 | " \n", 624 | " \n", 625 | " \n", 626 | " \n", 627 | " \n", 628 | " \n", 629 | " \n", 630 | " \n", 631 | " \n", 632 | " \n", 633 | " \n", 634 | " \n", 635 | " \n", 636 | " \n", 637 | " \n", 638 | " \n", 639 | " \n", 640 | " \n", 641 | " \n", 642 | " \n", 643 | " \n", 644 | " \n", 645 | " \n", 646 | " \n", 647 | " \n", 648 | " \n", 649 | " \n", 650 | " \n", 651 | " \n", 652 | " \n", 653 | " \n", 654 | " \n", 655 | " \n", 656 | " \n", 657 | " \n", 658 | " \n", 659 | " \n", 660 | " \n", 661 | " \n", 662 | " \n", 663 | " \n", 664 | " \n", 665 | " \n", 666 | " \n", 667 | " \n", 668 | " \n", 669 | " \n", 670 | " \n", 671 | " \n", 672 | " \n", 673 | " \n", 674 | " \n", 675 | " \n", 676 | " \n", 677 | " \n", 678 | " \n", 679 | " \n", 680 | " \n", 681 | "
GlucoseBloodPressureInsulinBMIDiabetesPedigreeFunction
014872033.60.627
18566026.60.351
218364023.30.672
389669428.10.167
41374016843.12.288
..................
7631017618032.90.171
76412270036.80.340
7651217211226.20.245
76612660030.10.349
7679370030.40.315
\n", 682 | "

768 rows × 5 columns

\n", 683 | "
" 684 | ], 685 | "text/plain": [ 686 | " Glucose BloodPressure Insulin BMI DiabetesPedigreeFunction\n", 687 | "0 148 72 0 33.6 0.627\n", 688 | "1 85 66 0 26.6 0.351\n", 689 | "2 183 64 0 23.3 0.672\n", 690 | "3 89 66 94 28.1 0.167\n", 691 | "4 137 40 168 43.1 2.288\n", 692 | ".. ... ... ... ... ...\n", 693 | "763 101 76 180 32.9 0.171\n", 694 | "764 122 70 0 36.8 0.340\n", 695 | "765 121 72 112 26.2 0.245\n", 696 | "766 126 60 0 30.1 0.349\n", 697 | "767 93 70 0 30.4 0.315\n", 698 | "\n", 699 | "[768 rows x 5 columns]" 700 | ] 701 | }, 702 | "execution_count": 9, 703 | "metadata": {}, 704 | "output_type": "execute_result" 705 | } 706 | ], 707 | "source": [ 708 | "feature" 709 | ] 710 | }, 711 | { 712 | "cell_type": "code", 713 | "execution_count": 10, 714 | "id": "8f76abae", 715 | "metadata": { 716 | "execution": { 717 | "iopub.execute_input": "2023-05-17T05:30:28.747604Z", 718 | "iopub.status.busy": "2023-05-17T05:30:28.747263Z", 719 | "iopub.status.idle": "2023-05-17T05:30:28.752607Z", 720 | "shell.execute_reply": "2023-05-17T05:30:28.751452Z" 721 | }, 722 | "papermill": { 723 | "duration": 0.013865, 724 | "end_time": "2023-05-17T05:30:28.754867", 725 | "exception": false, 726 | "start_time": "2023-05-17T05:30:28.741002", 727 | "status": "completed" 728 | }, 729 | "tags": [] 730 | }, 731 | "outputs": [], 732 | "source": [ 733 | "data['BMI'] = data['BMI'].astype(\"int\")" 734 | ] 735 | }, 736 | { 737 | "cell_type": "code", 738 | "execution_count": 11, 739 | "id": "831d83b6", 740 | "metadata": { 741 | "execution": { 742 | "iopub.execute_input": "2023-05-17T05:30:28.766969Z", 743 | "iopub.status.busy": "2023-05-17T05:30:28.766669Z", 744 | "iopub.status.idle": "2023-05-17T05:30:34.068993Z", 745 | "shell.execute_reply": "2023-05-17T05:30:34.067738Z" 746 | }, 747 | "papermill": { 748 | "duration": 5.310809, 749 | "end_time": "2023-05-17T05:30:34.071057", 750 | "exception": false, 751 | "start_time": "2023-05-17T05:30:28.760248", 752 | "status": "completed" 753 | }, 754 | "tags": [] 755 | }, 756 | "outputs": [ 757 | { 758 | "name": "stderr", 759 | "output_type": "stream", 760 | "text": [ 761 | "c:\\Users\\harin\\AppData\\Local\\Programs\\Python\\Python310\\lib\\site-packages\\sklearn\\utils\\validation.py:1143: DataConversionWarning: A column-vector y was passed when a 1d array was expected. Please change the shape of y to (n_samples, ), for example using ravel().\n", 762 | " y = column_or_1d(y, warn=True)\n" 763 | ] 764 | }, 765 | { 766 | "name": "stdout", 767 | "output_type": "stream", 768 | "text": [ 769 | "The accuracy of kernel: linear is 80%\n", 770 | "The accuracy of kernel: rbf is 77%\n", 771 | "The accuracy of kernel: poly is 75%\n" 772 | ] 773 | }, 774 | { 775 | "name": "stderr", 776 | "output_type": "stream", 777 | "text": [ 778 | "c:\\Users\\harin\\AppData\\Local\\Programs\\Python\\Python310\\lib\\site-packages\\sklearn\\utils\\validation.py:1143: DataConversionWarning: A column-vector y was passed when a 1d array was expected. Please change the shape of y to (n_samples, ), for example using ravel().\n", 779 | " y = column_or_1d(y, warn=True)\n", 780 | "c:\\Users\\harin\\AppData\\Local\\Programs\\Python\\Python310\\lib\\site-packages\\sklearn\\utils\\validation.py:1143: DataConversionWarning: A column-vector y was passed when a 1d array was expected. Please change the shape of y to (n_samples, ), for example using ravel().\n", 781 | " y = column_or_1d(y, warn=True)\n" 782 | ] 783 | } 784 | ], 785 | "source": [ 786 | "li = []\n", 787 | "kernels = [\"linear\",\"rbf\",\"poly\"]\n", 788 | "for i in range(0,len(kernels)):\n", 789 | " model = svm.SVC(kernel=kernels[i])\n", 790 | " x_train,x_test,y_train,y_test = sklearn.model_selection.train_test_split(feature,label,test_size=0.2)\n", 791 | " model.fit(x_train,y_train)\n", 792 | " prediction = model.predict(x_test)\n", 793 | " accuracy = metrics.accuracy_score(y_test,prediction)\n", 794 | " print(f\"The accuracy of kernel: {kernels[i]} is {int(accuracy*100)}%\")\n", 795 | " \n", 796 | " #li.append(accuracy)\n", 797 | "#print(\"Average Accuracy is:\",f\"{int(np.mean(li)*100)}%\")" 798 | ] 799 | }, 800 | { 801 | "cell_type": "code", 802 | "execution_count": 12, 803 | "id": "70fef5f2", 804 | "metadata": { 805 | "execution": { 806 | "iopub.execute_input": "2023-05-17T05:30:34.092791Z", 807 | "iopub.status.busy": "2023-05-17T05:30:34.092474Z", 808 | "iopub.status.idle": "2023-05-17T05:32:37.351981Z", 809 | "shell.execute_reply": "2023-05-17T05:32:37.351110Z" 810 | }, 811 | "papermill": { 812 | "duration": 123.273413, 813 | "end_time": "2023-05-17T05:32:37.359547", 814 | "exception": false, 815 | "start_time": "2023-05-17T05:30:34.086134", 816 | "status": "completed" 817 | }, 818 | "tags": [] 819 | }, 820 | "outputs": [ 821 | { 822 | "name": "stderr", 823 | "output_type": "stream", 824 | "text": [ 825 | "c:\\Users\\harin\\AppData\\Local\\Programs\\Python\\Python310\\lib\\site-packages\\sklearn\\utils\\validation.py:1143: DataConversionWarning: A column-vector y was passed when a 1d array was expected. Please change the shape of y to (n_samples, ), for example using ravel().\n", 826 | " y = column_or_1d(y, warn=True)\n" 827 | ] 828 | }, 829 | { 830 | "name": "stdout", 831 | "output_type": "stream", 832 | "text": [ 833 | "The accuracy of kernel: Linear is 74% C: 1\n" 834 | ] 835 | }, 836 | { 837 | "name": "stderr", 838 | "output_type": "stream", 839 | "text": [ 840 | "c:\\Users\\harin\\AppData\\Local\\Programs\\Python\\Python310\\lib\\site-packages\\sklearn\\utils\\validation.py:1143: DataConversionWarning: A column-vector y was passed when a 1d array was expected. Please change the shape of y to (n_samples, ), for example using ravel().\n", 841 | " y = column_or_1d(y, warn=True)\n" 842 | ] 843 | }, 844 | { 845 | "name": "stdout", 846 | "output_type": "stream", 847 | "text": [ 848 | "The accuracy of kernel: Linear is 77% C: 2\n" 849 | ] 850 | }, 851 | { 852 | "name": "stderr", 853 | "output_type": "stream", 854 | "text": [ 855 | "c:\\Users\\harin\\AppData\\Local\\Programs\\Python\\Python310\\lib\\site-packages\\sklearn\\utils\\validation.py:1143: DataConversionWarning: A column-vector y was passed when a 1d array was expected. Please change the shape of y to (n_samples, ), for example using ravel().\n", 856 | " y = column_or_1d(y, warn=True)\n" 857 | ] 858 | }, 859 | { 860 | "name": "stdout", 861 | "output_type": "stream", 862 | "text": [ 863 | "The accuracy of kernel: Linear is 75% C: 3\n" 864 | ] 865 | }, 866 | { 867 | "name": "stderr", 868 | "output_type": "stream", 869 | "text": [ 870 | "c:\\Users\\harin\\AppData\\Local\\Programs\\Python\\Python310\\lib\\site-packages\\sklearn\\utils\\validation.py:1143: DataConversionWarning: A column-vector y was passed when a 1d array was expected. Please change the shape of y to (n_samples, ), for example using ravel().\n", 871 | " y = column_or_1d(y, warn=True)\n" 872 | ] 873 | }, 874 | { 875 | "name": "stdout", 876 | "output_type": "stream", 877 | "text": [ 878 | "The accuracy of kernel: Linear is 77% C: 4\n" 879 | ] 880 | }, 881 | { 882 | "name": "stderr", 883 | "output_type": "stream", 884 | "text": [ 885 | "c:\\Users\\harin\\AppData\\Local\\Programs\\Python\\Python310\\lib\\site-packages\\sklearn\\utils\\validation.py:1143: DataConversionWarning: A column-vector y was passed when a 1d array was expected. Please change the shape of y to (n_samples, ), for example using ravel().\n", 886 | " y = column_or_1d(y, warn=True)\n" 887 | ] 888 | }, 889 | { 890 | "name": "stdout", 891 | "output_type": "stream", 892 | "text": [ 893 | "The accuracy of kernel: Linear is 78% C: 5\n" 894 | ] 895 | }, 896 | { 897 | "name": "stderr", 898 | "output_type": "stream", 899 | "text": [ 900 | "c:\\Users\\harin\\AppData\\Local\\Programs\\Python\\Python310\\lib\\site-packages\\sklearn\\utils\\validation.py:1143: DataConversionWarning: A column-vector y was passed when a 1d array was expected. Please change the shape of y to (n_samples, ), for example using ravel().\n", 901 | " y = column_or_1d(y, warn=True)\n" 902 | ] 903 | } 904 | ], 905 | "source": [ 906 | "for i in range(1,10):\n", 907 | " model = svm.SVC(kernel=\"linear\",C=i)\n", 908 | " x_train,x_test,y_train,y_test = sklearn.model_selection.train_test_split(feature,label,test_size=0.2)\n", 909 | " model.fit(x_train,y_train)\n", 910 | " prediction = model.predict(x_test)\n", 911 | " accuracy = metrics.accuracy_score(y_test,prediction)\n", 912 | " print(f\"The accuracy of kernel: Linear is {int(accuracy*100)}% C: {i}\")" 913 | ] 914 | } 915 | ], 916 | "metadata": { 917 | "kernelspec": { 918 | "display_name": "Python 3", 919 | "language": "python", 920 | "name": "python3" 921 | }, 922 | "language_info": { 923 | "codemirror_mode": { 924 | "name": "ipython", 925 | "version": 3 926 | }, 927 | "file_extension": ".py", 928 | "mimetype": "text/x-python", 929 | "name": "python", 930 | "nbconvert_exporter": "python", 931 | "pygments_lexer": "ipython3", 932 | "version": "3.10.0" 933 | }, 934 | "papermill": { 935 | "default_parameters": {}, 936 | "duration": 142.857483, 937 | "end_time": "2023-05-17T05:32:38.300466", 938 | "environment_variables": {}, 939 | "exception": null, 940 | "input_path": "__notebook__.ipynb", 941 | "output_path": "__notebook__.ipynb", 942 | "parameters": {}, 943 | "start_time": "2023-05-17T05:30:15.442983", 944 | "version": "2.4.0" 945 | } 946 | }, 947 | "nbformat": 4, 948 | "nbformat_minor": 5 949 | } 950 | -------------------------------------------------------------------------------- /winequality-prediction.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "cells": [ 3 | { 4 | "cell_type": "code", 5 | "execution_count": 3, 6 | "id": "a9c11110", 7 | "metadata": { 8 | "execution": { 9 | "iopub.execute_input": "2023-08-07T07:07:49.414411Z", 10 | "iopub.status.busy": "2023-08-07T07:07:49.413913Z", 11 | "iopub.status.idle": "2023-08-07T07:07:49.426948Z", 12 | "shell.execute_reply": "2023-08-07T07:07:49.425982Z" 13 | }, 14 | "papermill": { 15 | "duration": 0.023536, 16 | "end_time": "2023-08-07T07:07:49.429167", 17 | "exception": false, 18 | "start_time": "2023-08-07T07:07:49.405631", 19 | "status": "completed" 20 | }, 21 | "tags": [] 22 | }, 23 | "outputs": [], 24 | "source": [ 25 | "import pandas as pd\n", 26 | "import numpy as np\n", 27 | "import matplotlib.pyplot as plt\n", 28 | "%matplotlib inline" 29 | ] 30 | }, 31 | { 32 | "cell_type": "code", 33 | "execution_count": 4, 34 | "id": "8431d5c0", 35 | "metadata": { 36 | "execution": { 37 | "iopub.execute_input": "2023-08-07T07:07:49.441953Z", 38 | "iopub.status.busy": "2023-08-07T07:07:49.441587Z", 39 | "iopub.status.idle": "2023-08-07T07:07:49.499514Z", 40 | "shell.execute_reply": "2023-08-07T07:07:49.498507Z" 41 | }, 42 | "papermill": { 43 | "duration": 0.066537, 44 | "end_time": "2023-08-07T07:07:49.501606", 45 | "exception": false, 46 | "start_time": "2023-08-07T07:07:49.435069", 47 | "status": "completed" 48 | }, 49 | "tags": [] 50 | }, 51 | "outputs": [ 52 | { 53 | "data": { 54 | "text/html": [ 55 | "
\n", 56 | "\n", 69 | "\n", 70 | " \n", 71 | " \n", 72 | " \n", 73 | " \n", 74 | " \n", 75 | " \n", 76 | " \n", 77 | " \n", 78 | " \n", 79 | " \n", 80 | " \n", 81 | " \n", 82 | " \n", 83 | " \n", 84 | " \n", 85 | " \n", 86 | " \n", 87 | " \n", 88 | " \n", 89 | " \n", 90 | " \n", 91 | " \n", 92 | " \n", 93 | " \n", 94 | " \n", 95 | " \n", 96 | " \n", 97 | " \n", 98 | " \n", 99 | " \n", 100 | " \n", 101 | " \n", 102 | " \n", 103 | " \n", 104 | " \n", 105 | " \n", 106 | " \n", 107 | " \n", 108 | " \n", 109 | " \n", 110 | " \n", 111 | " \n", 112 | " \n", 113 | " \n", 114 | " \n", 115 | " \n", 116 | " \n", 117 | " \n", 118 | " \n", 119 | " \n", 120 | " \n", 121 | " \n", 122 | " \n", 123 | " \n", 124 | " \n", 125 | " \n", 126 | " \n", 127 | " \n", 128 | " \n", 129 | " \n", 130 | " \n", 131 | " \n", 132 | " \n", 133 | " \n", 134 | " \n", 135 | " \n", 136 | " \n", 137 | " \n", 138 | " \n", 139 | " \n", 140 | " \n", 141 | " \n", 142 | " \n", 143 | " \n", 144 | " \n", 145 | " \n", 146 | " \n", 147 | " \n", 148 | " \n", 149 | " \n", 150 | " \n", 151 | " \n", 152 | " \n", 153 | " \n", 154 | " \n", 155 | " \n", 156 | " \n", 157 | " \n", 158 | " \n", 159 | " \n", 160 | " \n", 161 | " \n", 162 | " \n", 163 | " \n", 164 | " \n", 165 | " \n", 166 | " \n", 167 | " \n", 168 | " \n", 169 | " \n", 170 | " \n", 171 | " \n", 172 | " \n", 173 | " \n", 174 | " \n", 175 | " \n", 176 | " \n", 177 | " \n", 178 | " \n", 179 | " \n", 180 | " \n", 181 | " \n", 182 | " \n", 183 | " \n", 184 | " \n", 185 | " \n", 186 | " \n", 187 | " \n", 188 | " \n", 189 | " \n", 190 | " \n", 191 | " \n", 192 | " \n", 193 | " \n", 194 | " \n", 195 | " \n", 196 | " \n", 197 | " \n", 198 | " \n", 199 | " \n", 200 | " \n", 201 | " \n", 202 | " \n", 203 | " \n", 204 | " \n", 205 | " \n", 206 | " \n", 207 | " \n", 208 | " \n", 209 | " \n", 210 | " \n", 211 | " \n", 212 | " \n", 213 | " \n", 214 | " \n", 215 | " \n", 216 | " \n", 217 | " \n", 218 | " \n", 219 | " \n", 220 | " \n", 221 | " \n", 222 | " \n", 223 | " \n", 224 | " \n", 225 | " \n", 226 | " \n", 227 | " \n", 228 | " \n", 229 | " \n", 230 | " \n", 231 | " \n", 232 | " \n", 233 | " \n", 234 | " \n", 235 | " \n", 236 | " \n", 237 | " \n", 238 | " \n", 239 | " \n", 240 | " \n", 241 | " \n", 242 | " \n", 243 | " \n", 244 | " \n", 245 | " \n", 246 | " \n", 247 | " \n", 248 | " \n", 249 | " \n", 250 | " \n", 251 | " \n", 252 | " \n", 253 | " \n", 254 | "
fixed acidityvolatile aciditycitric acidresidual sugarchloridesfree sulfur dioxidetotal sulfur dioxidedensitypHsulphatesalcoholquality
07.40.7000.001.90.07611.034.00.997803.510.569.45
17.80.8800.002.60.09825.067.00.996803.200.689.85
27.80.7600.042.30.09215.054.00.997003.260.659.85
311.20.2800.561.90.07517.060.00.998003.160.589.86
47.40.7000.001.90.07611.034.00.997803.510.569.45
.......................................
15946.20.6000.082.00.09032.044.00.994903.450.5810.55
15955.90.5500.102.20.06239.051.00.995123.520.7611.26
15966.30.5100.132.30.07629.040.00.995743.420.7511.06
15975.90.6450.122.00.07532.044.00.995473.570.7110.25
15986.00.3100.473.60.06718.042.00.995493.390.6611.06
\n", 255 | "

1599 rows × 12 columns

\n", 256 | "
" 257 | ], 258 | "text/plain": [ 259 | " fixed acidity volatile acidity citric acid residual sugar chlorides \\\n", 260 | "0 7.4 0.700 0.00 1.9 0.076 \n", 261 | "1 7.8 0.880 0.00 2.6 0.098 \n", 262 | "2 7.8 0.760 0.04 2.3 0.092 \n", 263 | "3 11.2 0.280 0.56 1.9 0.075 \n", 264 | "4 7.4 0.700 0.00 1.9 0.076 \n", 265 | "... ... ... ... ... ... \n", 266 | "1594 6.2 0.600 0.08 2.0 0.090 \n", 267 | "1595 5.9 0.550 0.10 2.2 0.062 \n", 268 | "1596 6.3 0.510 0.13 2.3 0.076 \n", 269 | "1597 5.9 0.645 0.12 2.0 0.075 \n", 270 | "1598 6.0 0.310 0.47 3.6 0.067 \n", 271 | "\n", 272 | " free sulfur dioxide total sulfur dioxide density pH sulphates \\\n", 273 | "0 11.0 34.0 0.99780 3.51 0.56 \n", 274 | "1 25.0 67.0 0.99680 3.20 0.68 \n", 275 | "2 15.0 54.0 0.99700 3.26 0.65 \n", 276 | "3 17.0 60.0 0.99800 3.16 0.58 \n", 277 | "4 11.0 34.0 0.99780 3.51 0.56 \n", 278 | "... ... ... ... ... ... \n", 279 | "1594 32.0 44.0 0.99490 3.45 0.58 \n", 280 | "1595 39.0 51.0 0.99512 3.52 0.76 \n", 281 | "1596 29.0 40.0 0.99574 3.42 0.75 \n", 282 | "1597 32.0 44.0 0.99547 3.57 0.71 \n", 283 | "1598 18.0 42.0 0.99549 3.39 0.66 \n", 284 | "\n", 285 | " alcohol quality \n", 286 | "0 9.4 5 \n", 287 | "1 9.8 5 \n", 288 | "2 9.8 5 \n", 289 | "3 9.8 6 \n", 290 | "4 9.4 5 \n", 291 | "... ... ... \n", 292 | "1594 10.5 5 \n", 293 | "1595 11.2 6 \n", 294 | "1596 11.0 6 \n", 295 | "1597 10.2 5 \n", 296 | "1598 11.0 6 \n", 297 | "\n", 298 | "[1599 rows x 12 columns]" 299 | ] 300 | }, 301 | "execution_count": 4, 302 | "metadata": {}, 303 | "output_type": "execute_result" 304 | } 305 | ], 306 | "source": [ 307 | "df= pd.read_csv(\"C:/Users/User/Downloads/winequality-red.csv\")\n", 308 | "df" 309 | ] 310 | }, 311 | { 312 | "cell_type": "code", 313 | "execution_count": 5, 314 | "id": "7bab339d", 315 | "metadata": { 316 | "execution": { 317 | "iopub.execute_input": "2023-08-07T07:07:49.514590Z", 318 | "iopub.status.busy": "2023-08-07T07:07:49.514173Z", 319 | "iopub.status.idle": "2023-08-07T07:07:49.544718Z", 320 | "shell.execute_reply": "2023-08-07T07:07:49.543381Z" 321 | }, 322 | "papermill": { 323 | "duration": 0.03933, 324 | "end_time": "2023-08-07T07:07:49.546661", 325 | "exception": false, 326 | "start_time": "2023-08-07T07:07:49.507331", 327 | "status": "completed" 328 | }, 329 | "tags": [] 330 | }, 331 | "outputs": [ 332 | { 333 | "data": { 334 | "text/html": [ 335 | "
\n", 336 | "\n", 349 | "\n", 350 | " \n", 351 | " \n", 352 | " \n", 353 | " \n", 354 | " \n", 355 | " \n", 356 | " \n", 357 | " \n", 358 | " \n", 359 | " \n", 360 | " \n", 361 | " \n", 362 | " \n", 363 | " \n", 364 | " \n", 365 | " \n", 366 | " \n", 367 | " \n", 368 | " \n", 369 | " \n", 370 | " \n", 371 | " \n", 372 | " \n", 373 | " \n", 374 | " \n", 375 | " \n", 376 | " \n", 377 | " \n", 378 | " \n", 379 | " \n", 380 | " \n", 381 | " \n", 382 | " \n", 383 | " \n", 384 | " \n", 385 | " \n", 386 | " \n", 387 | " \n", 388 | " \n", 389 | " \n", 390 | " \n", 391 | " \n", 392 | " \n", 393 | " \n", 394 | " \n", 395 | " \n", 396 | " \n", 397 | " \n", 398 | " \n", 399 | " \n", 400 | " \n", 401 | " \n", 402 | " \n", 403 | " \n", 404 | " \n", 405 | " \n", 406 | " \n", 407 | " \n", 408 | " \n", 409 | " \n", 410 | " \n", 411 | " \n", 412 | " \n", 413 | " \n", 414 | " \n", 415 | " \n", 416 | " \n", 417 | " \n", 418 | " \n", 419 | " \n", 420 | " \n", 421 | " \n", 422 | " \n", 423 | " \n", 424 | " \n", 425 | " \n", 426 | " \n", 427 | " \n", 428 | " \n", 429 | " \n", 430 | " \n", 431 | " \n", 432 | " \n", 433 | " \n", 434 | " \n", 435 | " \n", 436 | " \n", 437 | " \n", 438 | " \n", 439 | " \n", 440 | " \n", 441 | " \n", 442 | " \n", 443 | " \n", 444 | " \n", 445 | " \n", 446 | " \n", 447 | " \n", 448 | " \n", 449 | " \n", 450 | " \n", 451 | " \n", 452 | " \n", 453 | " \n", 454 | " \n", 455 | " \n", 456 | " \n", 457 | " \n", 458 | " \n", 459 | " \n", 460 | " \n", 461 | " \n", 462 | " \n", 463 | " \n", 464 | " \n", 465 | " \n", 466 | " \n", 467 | " \n", 468 | " \n", 469 | " \n", 470 | " \n", 471 | " \n", 472 | " \n", 473 | " \n", 474 | " \n", 475 | " \n", 476 | " \n", 477 | " \n", 478 | " \n", 479 | " \n", 480 | " \n", 481 | " \n", 482 | " \n", 483 | " \n", 484 | " \n", 485 | " \n", 486 | " \n", 487 | " \n", 488 | " \n", 489 | " \n", 490 | " \n", 491 | " \n", 492 | " \n", 493 | " \n", 494 | " \n", 495 | " \n", 496 | " \n", 497 | " \n", 498 | " \n", 499 | " \n", 500 | " \n", 501 | " \n", 502 | " \n", 503 | " \n", 504 | " \n", 505 | " \n", 506 | " \n", 507 | " \n", 508 | " \n", 509 | " \n", 510 | " \n", 511 | " \n", 512 | " \n", 513 | " \n", 514 | " \n", 515 | " \n", 516 | " \n", 517 | " \n", 518 | " \n", 519 | " \n", 520 | " \n", 521 | " \n", 522 | "
fixed acidityvolatile aciditycitric acidresidual sugarchloridesfree sulfur dioxidetotal sulfur dioxidedensitypHsulphatesalcohol
07.40.7000.001.90.07611.034.00.997803.510.569.4
17.80.8800.002.60.09825.067.00.996803.200.689.8
27.80.7600.042.30.09215.054.00.997003.260.659.8
311.20.2800.561.90.07517.060.00.998003.160.589.8
47.40.7000.001.90.07611.034.00.997803.510.569.4
....................................
15946.20.6000.082.00.09032.044.00.994903.450.5810.5
15955.90.5500.102.20.06239.051.00.995123.520.7611.2
15966.30.5100.132.30.07629.040.00.995743.420.7511.0
15975.90.6450.122.00.07532.044.00.995473.570.7110.2
15986.00.3100.473.60.06718.042.00.995493.390.6611.0
\n", 523 | "

1599 rows × 11 columns

\n", 524 | "
" 525 | ], 526 | "text/plain": [ 527 | " fixed acidity volatile acidity citric acid residual sugar chlorides \\\n", 528 | "0 7.4 0.700 0.00 1.9 0.076 \n", 529 | "1 7.8 0.880 0.00 2.6 0.098 \n", 530 | "2 7.8 0.760 0.04 2.3 0.092 \n", 531 | "3 11.2 0.280 0.56 1.9 0.075 \n", 532 | "4 7.4 0.700 0.00 1.9 0.076 \n", 533 | "... ... ... ... ... ... \n", 534 | "1594 6.2 0.600 0.08 2.0 0.090 \n", 535 | "1595 5.9 0.550 0.10 2.2 0.062 \n", 536 | "1596 6.3 0.510 0.13 2.3 0.076 \n", 537 | "1597 5.9 0.645 0.12 2.0 0.075 \n", 538 | "1598 6.0 0.310 0.47 3.6 0.067 \n", 539 | "\n", 540 | " free sulfur dioxide total sulfur dioxide density pH sulphates \\\n", 541 | "0 11.0 34.0 0.99780 3.51 0.56 \n", 542 | "1 25.0 67.0 0.99680 3.20 0.68 \n", 543 | "2 15.0 54.0 0.99700 3.26 0.65 \n", 544 | "3 17.0 60.0 0.99800 3.16 0.58 \n", 545 | "4 11.0 34.0 0.99780 3.51 0.56 \n", 546 | "... ... ... ... ... ... \n", 547 | "1594 32.0 44.0 0.99490 3.45 0.58 \n", 548 | "1595 39.0 51.0 0.99512 3.52 0.76 \n", 549 | "1596 29.0 40.0 0.99574 3.42 0.75 \n", 550 | "1597 32.0 44.0 0.99547 3.57 0.71 \n", 551 | "1598 18.0 42.0 0.99549 3.39 0.66 \n", 552 | "\n", 553 | " alcohol \n", 554 | "0 9.4 \n", 555 | "1 9.8 \n", 556 | "2 9.8 \n", 557 | "3 9.8 \n", 558 | "4 9.4 \n", 559 | "... ... \n", 560 | "1594 10.5 \n", 561 | "1595 11.2 \n", 562 | "1596 11.0 \n", 563 | "1597 10.2 \n", 564 | "1598 11.0 \n", 565 | "\n", 566 | "[1599 rows x 11 columns]" 567 | ] 568 | }, 569 | "execution_count": 5, 570 | "metadata": {}, 571 | "output_type": "execute_result" 572 | } 573 | ], 574 | "source": [ 575 | "#splitting input and output features\n", 576 | "X=df.drop(\"quality\",axis=1)\n", 577 | "Y=df[\"quality\"]\n", 578 | "X\n" 579 | ] 580 | }, 581 | { 582 | "cell_type": "code", 583 | "execution_count": 6, 584 | "id": "37c1eedc", 585 | "metadata": { 586 | "execution": { 587 | "iopub.execute_input": "2023-08-07T07:07:49.560673Z", 588 | "iopub.status.busy": "2023-08-07T07:07:49.560279Z", 589 | "iopub.status.idle": "2023-08-07T07:07:49.567578Z", 590 | "shell.execute_reply": "2023-08-07T07:07:49.566745Z" 591 | }, 592 | "papermill": { 593 | "duration": 0.016584, 594 | "end_time": "2023-08-07T07:07:49.569561", 595 | "exception": false, 596 | "start_time": "2023-08-07T07:07:49.552977", 597 | "status": "completed" 598 | }, 599 | "tags": [] 600 | }, 601 | "outputs": [ 602 | { 603 | "data": { 604 | "text/plain": [ 605 | "0 5\n", 606 | "1 5\n", 607 | "2 5\n", 608 | "3 6\n", 609 | "4 5\n", 610 | " ..\n", 611 | "1594 5\n", 612 | "1595 6\n", 613 | "1596 6\n", 614 | "1597 5\n", 615 | "1598 6\n", 616 | "Name: quality, Length: 1599, dtype: int64" 617 | ] 618 | }, 619 | "execution_count": 6, 620 | "metadata": {}, 621 | "output_type": "execute_result" 622 | } 623 | ], 624 | "source": [ 625 | "Y" 626 | ] 627 | }, 628 | { 629 | "cell_type": "code", 630 | "execution_count": 7, 631 | "id": "22c404f5", 632 | "metadata": { 633 | "execution": { 634 | "iopub.execute_input": "2023-08-07T07:07:49.584536Z", 635 | "iopub.status.busy": "2023-08-07T07:07:49.583774Z", 636 | "iopub.status.idle": "2023-08-07T07:07:50.921198Z", 637 | "shell.execute_reply": "2023-08-07T07:07:50.919600Z" 638 | }, 639 | "papermill": { 640 | "duration": 1.348708, 641 | "end_time": "2023-08-07T07:07:50.924625", 642 | "exception": false, 643 | "start_time": "2023-08-07T07:07:49.575917", 644 | "status": "completed" 645 | }, 646 | "tags": [] 647 | }, 648 | "outputs": [], 649 | "source": [ 650 | "#splitting the data into training and testing sets (70% training and 30% testing)\n", 651 | "from sklearn.model_selection import train_test_split,cross_val_score\n", 652 | "X_train,X_test,Y_train,Y_test=train_test_split(X,Y,test_size=0.3,random_state=42)\n" 653 | ] 654 | }, 655 | { 656 | "cell_type": "code", 657 | "execution_count": 8, 658 | "id": "3610bf65", 659 | "metadata": { 660 | "execution": { 661 | "iopub.execute_input": "2023-08-07T07:07:50.941093Z", 662 | "iopub.status.busy": "2023-08-07T07:07:50.940199Z", 663 | "iopub.status.idle": "2023-08-07T07:07:50.947492Z", 664 | "shell.execute_reply": "2023-08-07T07:07:50.946150Z" 665 | }, 666 | "papermill": { 667 | "duration": 0.018691, 668 | "end_time": "2023-08-07T07:07:50.950277", 669 | "exception": false, 670 | "start_time": "2023-08-07T07:07:50.931586", 671 | "status": "completed" 672 | }, 673 | "tags": [] 674 | }, 675 | "outputs": [ 676 | { 677 | "name": "stdout", 678 | "output_type": "stream", 679 | "text": [ 680 | "Shape of X_train: (1119, 11)\n", 681 | "Shape of X_test: (480, 11)\n", 682 | "Shape of Y_train: (1119,)\n", 683 | "Shape of Y_test: (480,)\n" 684 | ] 685 | } 686 | ], 687 | "source": [ 688 | "import numpy as np\n", 689 | "\n", 690 | "# Assuming you have split the data into X_train, X_test, y_train, y_test\n", 691 | "print(\"Shape of X_train:\", X_train.shape)\n", 692 | "print(\"Shape of X_test:\", X_test.shape)\n", 693 | "print(\"Shape of Y_train:\", Y_train.shape)\n", 694 | "print(\"Shape of Y_test:\", Y_test.shape)" 695 | ] 696 | }, 697 | { 698 | "cell_type": "code", 699 | "execution_count": 9, 700 | "id": "bae513aa", 701 | "metadata": { 702 | "execution": { 703 | "iopub.execute_input": "2023-08-07T07:07:50.966761Z", 704 | "iopub.status.busy": "2023-08-07T07:07:50.966234Z", 705 | "iopub.status.idle": "2023-08-07T07:07:51.130001Z", 706 | "shell.execute_reply": "2023-08-07T07:07:51.128498Z" 707 | }, 708 | "papermill": { 709 | "duration": 0.176061, 710 | "end_time": "2023-08-07T07:07:51.133273", 711 | "exception": false, 712 | "start_time": "2023-08-07T07:07:50.957212", 713 | "status": "completed" 714 | }, 715 | "tags": [] 716 | }, 717 | "outputs": [ 718 | { 719 | "data": { 720 | "text/html": [ 721 | "
LinearRegression()
In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
On GitHub, the HTML representation is unable to render, please try loading this page with nbviewer.org.
" 722 | ], 723 | "text/plain": [ 724 | "LinearRegression()" 725 | ] 726 | }, 727 | "execution_count": 9, 728 | "metadata": {}, 729 | "output_type": "execute_result" 730 | } 731 | ], 732 | "source": [ 733 | "#creating LogisticRegression model\n", 734 | "from sklearn.linear_model import LinearRegression\n", 735 | "model = LinearRegression()\n", 736 | "\n", 737 | "#train the model using training data\n", 738 | "model.fit(X_train,Y_train)" 739 | ] 740 | }, 741 | { 742 | "cell_type": "code", 743 | "execution_count": 10, 744 | "id": "ebde7927", 745 | "metadata": { 746 | "execution": { 747 | "iopub.execute_input": "2023-08-07T07:07:51.162479Z", 748 | "iopub.status.busy": "2023-08-07T07:07:51.161422Z", 749 | "iopub.status.idle": "2023-08-07T07:07:51.172331Z", 750 | "shell.execute_reply": "2023-08-07T07:07:51.171039Z" 751 | }, 752 | "papermill": { 753 | "duration": 0.032875, 754 | "end_time": "2023-08-07T07:07:51.177836", 755 | "exception": false, 756 | "start_time": "2023-08-07T07:07:51.144961", 757 | "status": "completed" 758 | }, 759 | "tags": [] 760 | }, 761 | "outputs": [], 762 | "source": [ 763 | "#make predictions on train data\n", 764 | "\n", 765 | "train_pred=model.predict(X_train)\n", 766 | "#train_pred=train_pred.astype(int)" 767 | ] 768 | }, 769 | { 770 | "cell_type": "code", 771 | "execution_count": 11, 772 | "id": "a97b86a7", 773 | "metadata": { 774 | "execution": { 775 | "iopub.execute_input": "2023-08-07T07:07:51.265837Z", 776 | "iopub.status.busy": "2023-08-07T07:07:51.265163Z", 777 | "iopub.status.idle": "2023-08-07T07:07:51.282683Z", 778 | "shell.execute_reply": "2023-08-07T07:07:51.281095Z" 779 | }, 780 | "papermill": { 781 | "duration": 0.035588, 782 | "end_time": "2023-08-07T07:07:51.286915", 783 | "exception": false, 784 | "start_time": "2023-08-07T07:07:51.251327", 785 | "status": "completed" 786 | }, 787 | "tags": [] 788 | }, 789 | "outputs": [ 790 | { 791 | "name": "stdout", 792 | "output_type": "stream", 793 | "text": [ 794 | "MAE: 0.49518748493865494\n", 795 | "RMSE: 0.6486806989670354\n", 796 | "R-Squared: 0.36119824413213175\n" 797 | ] 798 | } 799 | ], 800 | "source": [ 801 | "from sklearn import metrics\n", 802 | "\n", 803 | "# evaluating the model on the training data\n", 804 | "\n", 805 | "print(\"MAE:\",metrics.mean_absolute_error(Y_train,train_pred))\n", 806 | "print(\"RMSE:\",np.sqrt(metrics.mean_squared_error(Y_train,train_pred)))\n", 807 | "print(\"R-Squared:\",metrics.r2_score(Y_train,train_pred))" 808 | ] 809 | }, 810 | { 811 | "cell_type": "code", 812 | "execution_count": 12, 813 | "id": "8a002e4e", 814 | "metadata": { 815 | "execution": { 816 | "iopub.execute_input": "2023-08-07T07:07:51.305107Z", 817 | "iopub.status.busy": "2023-08-07T07:07:51.304634Z", 818 | "iopub.status.idle": "2023-08-07T07:07:51.312423Z", 819 | "shell.execute_reply": "2023-08-07T07:07:51.311247Z" 820 | }, 821 | "papermill": { 822 | "duration": 0.018979, 823 | "end_time": "2023-08-07T07:07:51.314834", 824 | "exception": false, 825 | "start_time": "2023-08-07T07:07:51.295855", 826 | "status": "completed" 827 | }, 828 | "tags": [] 829 | }, 830 | "outputs": [], 831 | "source": [ 832 | "# Make predictions on test data\n", 833 | "\n", 834 | "test_pred = model.predict(X_test)" 835 | ] 836 | }, 837 | { 838 | "cell_type": "code", 839 | "execution_count": 13, 840 | "id": "1630eb92", 841 | "metadata": { 842 | "execution": { 843 | "iopub.execute_input": "2023-08-07T07:07:51.331995Z", 844 | "iopub.status.busy": "2023-08-07T07:07:51.331108Z", 845 | "iopub.status.idle": "2023-08-07T07:07:51.339214Z", 846 | "shell.execute_reply": "2023-08-07T07:07:51.337915Z" 847 | }, 848 | "papermill": { 849 | "duration": 0.019394, 850 | "end_time": "2023-08-07T07:07:51.341607", 851 | "exception": false, 852 | "start_time": "2023-08-07T07:07:51.322213", 853 | "status": "completed" 854 | }, 855 | "tags": [] 856 | }, 857 | "outputs": [ 858 | { 859 | "name": "stdout", 860 | "output_type": "stream", 861 | "text": [ 862 | "MAE: 0.513395608245112\n", 863 | "RMSE: 0.6412759715991394\n", 864 | "R-Squared: 0.3513885332505232\n" 865 | ] 866 | } 867 | ], 868 | "source": [ 869 | "# evaluating the model on the testing data\n", 870 | "\n", 871 | "print(\"MAE:\",metrics.mean_absolute_error(Y_test,test_pred))\n", 872 | "print(\"RMSE:\",np.sqrt(metrics.mean_squared_error(Y_test,test_pred)))\n", 873 | "print(\"R-Squared:\",metrics.r2_score(Y_test,test_pred))" 874 | ] 875 | }, 876 | { 877 | "cell_type": "code", 878 | "execution_count": 14, 879 | "id": "ceda0c78", 880 | "metadata": { 881 | "execution": { 882 | "iopub.execute_input": "2023-08-07T07:07:51.386950Z", 883 | "iopub.status.busy": "2023-08-07T07:07:51.386011Z", 884 | "iopub.status.idle": "2023-08-07T07:07:51.444225Z", 885 | "shell.execute_reply": "2023-08-07T07:07:51.442615Z" 886 | }, 887 | "papermill": { 888 | "duration": 0.070712, 889 | "end_time": "2023-08-07T07:07:51.447748", 890 | "exception": false, 891 | "start_time": "2023-08-07T07:07:51.377036", 892 | "status": "completed" 893 | }, 894 | "tags": [] 895 | }, 896 | "outputs": [ 897 | { 898 | "name": "stdout", 899 | "output_type": "stream", 900 | "text": [ 901 | "The r2 using 5-fold cross-validation on training data: 0.334985992062552\n" 902 | ] 903 | } 904 | ], 905 | "source": [ 906 | "# Perform k-fold cross-validation on the training data \n", 907 | "\n", 908 | "from sklearn.model_selection import cross_val_score\n", 909 | "\n", 910 | "r2_cv_scores = cross_val_score(model,X_train,Y_train,cv=5,scoring='r2')\n", 911 | "mean_r2train_cv = r2_cv_scores.mean()\n", 912 | "print(\"The r2 using 5-fold cross-validation on training data:\", mean_r2train_cv)\n" 913 | ] 914 | }, 915 | { 916 | "cell_type": "code", 917 | "execution_count": 15, 918 | "id": "eade077a", 919 | "metadata": { 920 | "execution": { 921 | "iopub.execute_input": "2023-08-07T07:07:51.483401Z", 922 | "iopub.status.busy": "2023-08-07T07:07:51.482683Z", 923 | "iopub.status.idle": "2023-08-07T07:07:51.556137Z", 924 | "shell.execute_reply": "2023-08-07T07:07:51.554781Z" 925 | }, 926 | "papermill": { 927 | "duration": 0.094352, 928 | "end_time": "2023-08-07T07:07:51.559680", 929 | "exception": false, 930 | "start_time": "2023-08-07T07:07:51.465328", 931 | "status": "completed" 932 | }, 933 | "tags": [] 934 | }, 935 | "outputs": [ 936 | { 937 | "name": "stdout", 938 | "output_type": "stream", 939 | "text": [ 940 | "The r2 using 5-fold cross-validation on testing data: 0.326678061098226\n" 941 | ] 942 | } 943 | ], 944 | "source": [ 945 | "# Perform k-fold cross-validation on the testing data \n", 946 | "\n", 947 | "r2test_cv_scores = cross_val_score(model,X_test,Y_test,cv=5,scoring='r2')\n", 948 | "mean_r2test_cv= r2test_cv_scores.mean()\n", 949 | "print(\"The r2 using 5-fold cross-validation on testing data:\", mean_r2test_cv)\n" 950 | ] 951 | }, 952 | { 953 | "cell_type": "code", 954 | "execution_count": 16, 955 | "id": "f2e8f598", 956 | "metadata": { 957 | "execution": { 958 | "iopub.execute_input": "2023-08-07T07:07:51.591703Z", 959 | "iopub.status.busy": "2023-08-07T07:07:51.591246Z", 960 | "iopub.status.idle": "2023-08-07T07:07:51.644925Z", 961 | "shell.execute_reply": "2023-08-07T07:07:51.643797Z" 962 | }, 963 | "papermill": { 964 | "duration": 0.06555, 965 | "end_time": "2023-08-07T07:07:51.648211", 966 | "exception": false, 967 | "start_time": "2023-08-07T07:07:51.582661", 968 | "status": "completed" 969 | }, 970 | "tags": [] 971 | }, 972 | "outputs": [ 973 | { 974 | "name": "stdout", 975 | "output_type": "stream", 976 | "text": [ 977 | "The mean squared error using 5-fold cross-validation on training data: -0.43652212341343855\n" 978 | ] 979 | } 980 | ], 981 | "source": [ 982 | "# Perform k-fold cross-validation on the training data \n", 983 | "msetrain_cv_scores = cross_val_score(model,X_train,Y_train,cv=5,scoring='neg_mean_squared_error')\n", 984 | "mean_msetrain_cv = msetrain_cv_scores.mean()\n", 985 | "print(\"The mean squared error using 5-fold cross-validation on training data:\", mean_msetrain_cv)" 986 | ] 987 | }, 988 | { 989 | "cell_type": "code", 990 | "execution_count": 17, 991 | "id": "d8eca687", 992 | "metadata": { 993 | "execution": { 994 | "iopub.execute_input": "2023-08-07T07:07:51.675607Z", 995 | "iopub.status.busy": "2023-08-07T07:07:51.674949Z", 996 | "iopub.status.idle": "2023-08-07T07:07:51.721929Z", 997 | "shell.execute_reply": "2023-08-07T07:07:51.720700Z" 998 | }, 999 | "papermill": { 1000 | "duration": 0.064823, 1001 | "end_time": "2023-08-07T07:07:51.725314", 1002 | "exception": false, 1003 | "start_time": "2023-08-07T07:07:51.660491", 1004 | "status": "completed" 1005 | }, 1006 | "tags": [] 1007 | }, 1008 | "outputs": [ 1009 | { 1010 | "name": "stdout", 1011 | "output_type": "stream", 1012 | "text": [ 1013 | "The mean squared error using 5-fold cross-validation on testing data: -0.4235962818050936\n" 1014 | ] 1015 | } 1016 | ], 1017 | "source": [ 1018 | "# Perform k-fold cross-validation on the training data \n", 1019 | "msetest_cv_scores = cross_val_score(model,X_test,Y_test,cv=5,scoring='neg_mean_squared_error')\n", 1020 | "mean_msetest_cv = msetest_cv_scores.mean()\n", 1021 | "print(\"The mean squared error using 5-fold cross-validation on testing data:\", mean_msetest_cv)" 1022 | ] 1023 | }, 1024 | { 1025 | "cell_type": "code", 1026 | "execution_count": 18, 1027 | "id": "f2be066f", 1028 | "metadata": { 1029 | "execution": { 1030 | "iopub.execute_input": "2023-08-07T07:07:51.782441Z", 1031 | "iopub.status.busy": "2023-08-07T07:07:51.781493Z", 1032 | "iopub.status.idle": "2023-08-07T07:07:51.836107Z", 1033 | "shell.execute_reply": "2023-08-07T07:07:51.834934Z" 1034 | }, 1035 | "papermill": { 1036 | "duration": 0.067354, 1037 | "end_time": "2023-08-07T07:07:51.839451", 1038 | "exception": false, 1039 | "start_time": "2023-08-07T07:07:51.772097", 1040 | "status": "completed" 1041 | }, 1042 | "tags": [] 1043 | }, 1044 | "outputs": [ 1045 | { 1046 | "name": "stdout", 1047 | "output_type": "stream", 1048 | "text": [ 1049 | "The root mean squared error using 5-fold cross-validation on training data: -0.6592628863743302\n" 1050 | ] 1051 | } 1052 | ], 1053 | "source": [ 1054 | "rmsetrain_cv_scores = cross_val_score(model,X_train,Y_train,cv=5,scoring='neg_root_mean_squared_error')\n", 1055 | "mean_rmsetrain_cv= rmsetrain_cv_scores.mean()\n", 1056 | "print(\"The root mean squared error using 5-fold cross-validation on training data:\", mean_rmsetrain_cv)\n" 1057 | ] 1058 | }, 1059 | { 1060 | "cell_type": "code", 1061 | "execution_count": 19, 1062 | "id": "aaeadaf6", 1063 | "metadata": { 1064 | "execution": { 1065 | "iopub.execute_input": "2023-08-07T07:07:51.867554Z", 1066 | "iopub.status.busy": "2023-08-07T07:07:51.866990Z", 1067 | "iopub.status.idle": "2023-08-07T07:07:51.917291Z", 1068 | "shell.execute_reply": "2023-08-07T07:07:51.915704Z" 1069 | }, 1070 | "papermill": { 1071 | "duration": 0.06848, 1072 | "end_time": "2023-08-07T07:07:51.920600", 1073 | "exception": false, 1074 | "start_time": "2023-08-07T07:07:51.852120", 1075 | "status": "completed" 1076 | }, 1077 | "tags": [] 1078 | }, 1079 | "outputs": [ 1080 | { 1081 | "name": "stdout", 1082 | "output_type": "stream", 1083 | "text": [ 1084 | "The root mean squared error using 5-fold cross-validation on testing data: -0.6496133904328669\n" 1085 | ] 1086 | } 1087 | ], 1088 | "source": [ 1089 | "rmsetest_cv_scores = cross_val_score(model,X_test,Y_test,cv=5,scoring='neg_root_mean_squared_error')\n", 1090 | "mean_rmsetest_cv= rmsetest_cv_scores.mean()\n", 1091 | "print(\"The root mean squared error using 5-fold cross-validation on testing data:\", mean_rmsetest_cv)\n" 1092 | ] 1093 | } 1094 | ], 1095 | "metadata": { 1096 | "kernelspec": { 1097 | "display_name": "Python 3", 1098 | "language": "python", 1099 | "name": "python3" 1100 | }, 1101 | "language_info": { 1102 | "codemirror_mode": { 1103 | "name": "ipython", 1104 | "version": 3 1105 | }, 1106 | "file_extension": ".py", 1107 | "mimetype": "text/x-python", 1108 | "name": "python", 1109 | "nbconvert_exporter": "python", 1110 | "pygments_lexer": "ipython3", 1111 | "version": "3.10.0" 1112 | }, 1113 | "papermill": { 1114 | "default_parameters": {}, 1115 | "duration": 13.529599, 1116 | "end_time": "2023-08-07T07:07:52.877766", 1117 | "environment_variables": {}, 1118 | "exception": null, 1119 | "input_path": "__notebook__.ipynb", 1120 | "output_path": "__notebook__.ipynb", 1121 | "parameters": {}, 1122 | "start_time": "2023-08-07T07:07:39.348167", 1123 | "version": "2.4.0" 1124 | } 1125 | }, 1126 | "nbformat": 4, 1127 | "nbformat_minor": 5 1128 | } 1129 | --------------------------------------------------------------------------------