├── .gitignore ├── LICENSE ├── README.md ├── Week 2 - Linear Regression ├── Multi Variable Linear Regression.ipynb ├── One Variable Linear Regression.ipynb ├── ex1data1.csv ├── ex1data2.csv └── img │ ├── alpha_cost.JPG │ ├── h.JPG │ ├── j.JPG │ ├── jmult.JPG │ ├── jmult_p.JPG │ ├── normal.JPG │ └── thta.JPG ├── Week 3 - Logistic Regression ├── Logistic Regression.ipynb ├── Regularized Logistic Regression.ipynb ├── ex2data1.csv ├── ex2data2.csv └── img │ ├── fit.JPG │ ├── gradient.JPG │ ├── gradient_reg.JPG │ ├── gradient_reg_.JPG │ ├── j.JPG │ ├── j_reg.JPG │ ├── lr-h.JPG │ ├── map_feature.JPG │ └── sigmoid.JPG ├── Week 4 - Multi-Class Classification and Neural Networks ├── Multi-Class Classification.ipynb ├── Neural Networks.ipynb ├── ex3data1.mat ├── ex3weights.mat └── img │ ├── bx.JPG │ ├── fullgrad.JPG │ ├── grad.JPG │ ├── h-y.JPG │ ├── j.JPG │ ├── nn.JPG │ ├── plot.JPG │ ├── x.JPG │ ├── xandtheta.JPG │ └── xtheta.JPG ├── Week 5 - Neural Networks Learning ├── Backpropagation.ipynb ├── Neural Networks.ipynb ├── ex4data1.mat ├── ex4weights.mat └── img │ ├── acc_grad.JPG │ ├── backprop.JPG │ ├── delta.JPG │ ├── dj.JPG │ ├── fi.JPG │ ├── full_grad.JPG │ ├── g_grad.JPG │ ├── grad_reg.JPG │ ├── hidden_backprop.JPG │ ├── j_reg.JPG │ ├── nn.JPG │ ├── plot.JPG │ ├── sig.JPG │ ├── theta_dif.JPG │ ├── x.JPG │ └── y.JPG └── Week 6 - Regularized Linear Regression and Bias v.s. 
Variance ├── Polynomial Regression.ipynb ├── Regularized Linear Regression.ipynb ├── Xtest.csv ├── Xval.csv ├── ex5data1.mat ├── img ├── jtrain.JPG ├── poly.JPG ├── rlrc.JPG └── rlrg.JPG ├── ytest.csv └── yval.csv /.gitignore: -------------------------------------------------------------------------------- 1 | # Byte-compiled / optimized / DLL files 2 | __pycache__/ 3 | *.py[cod] 4 | *$py.class 5 | 6 | # C extensions 7 | *.so 8 | 9 | # Distribution / packaging 10 | .Python 11 | build/ 12 | develop-eggs/ 13 | dist/ 14 | downloads/ 15 | eggs/ 16 | .eggs/ 17 | lib/ 18 | lib64/ 19 | parts/ 20 | sdist/ 21 | var/ 22 | wheels/ 23 | *.egg-info/ 24 | .installed.cfg 25 | *.egg 26 | MANIFEST 27 | 28 | # PyInstaller 29 | # Usually these files are written by a python script from a template 30 | # before PyInstaller builds the exe, so as to inject date/other infos into it. 31 | *.manifest 32 | *.spec 33 | 34 | # Installer logs 35 | pip-log.txt 36 | pip-delete-this-directory.txt 37 | 38 | # Unit test / coverage reports 39 | htmlcov/ 40 | .tox/ 41 | .coverage 42 | .coverage.* 43 | .cache 44 | nosetests.xml 45 | coverage.xml 46 | *.cover 47 | .hypothesis/ 48 | .pytest_cache/ 49 | 50 | # Translations 51 | *.mo 52 | *.pot 53 | 54 | # Django stuff: 55 | *.log 56 | local_settings.py 57 | db.sqlite3 58 | 59 | # Flask stuff: 60 | instance/ 61 | .webassets-cache 62 | 63 | # Scrapy stuff: 64 | .scrapy 65 | 66 | # Sphinx documentation 67 | docs/_build/ 68 | 69 | # PyBuilder 70 | target/ 71 | 72 | # Jupyter Notebook 73 | .ipynb_checkpoints 74 | 75 | # pyenv 76 | .python-version 77 | 78 | # celery beat schedule file 79 | celerybeat-schedule 80 | 81 | # SageMath parsed files 82 | *.sage.py 83 | 84 | # Environments 85 | .env 86 | .venv 87 | env/ 88 | venv/ 89 | ENV/ 90 | env.bak/ 91 | venv.bak/ 92 | 93 | # Spyder project settings 94 | .spyderproject 95 | .spyproject 96 | 97 | # Rope project settings 98 | .ropeproject 99 | 100 | # mkdocs documentation 101 | /site 102 | 103 | # mypy 104 | 
.mypy_cache/ 105 | 106 | # .csv generated from .mat 107 | X.csv 108 | y.csv 109 | Theta1.csv 110 | Theta2.csv -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- 1 | MIT License 2 | 3 | Copyright (c) 2018 M. Doosti Lakhani 4 | 5 | Permission is hereby granted, free of charge, to any person obtaining a copy 6 | of this software and associated documentation files (the "Software"), to deal 7 | in the Software without restriction, including without limitation the rights 8 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 9 | copies of the Software, and to permit persons to whom the Software is 10 | furnished to do so, subject to the following conditions: 11 | 12 | The above copyright notice and this permission notice shall be included in all 13 | copies or substantial portions of the Software. 14 | 15 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 16 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 17 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE 18 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 19 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 20 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 21 | SOFTWARE. 22 | -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- 1 | # [NO LONGER DEVELOPED] Coursera Machine Learning by Andrew Ng 2 | In this repository I implemented few assignments in python. (No octave to python library) 3 | 4 | # Acknowledgement 5 | I started learning python by learning machine learning at the same time and I may have a lot of inefficient/ugly/... codes here. 
6 | There are lots of good repos out there for this course, please use them. 7 | 8 | # Features 9 | 1. All optional exercises have been done 10 | 2. All computations done in vectorized form 11 | 12 | # Schedule 13 | - [x] Week 2 - Linear Regression
14 | - [x] Linear Regression With One Variable 15 | - [x] Linear Regression With Multiple Variable 16 | - [x] Week 3 - Logistic Regression
17 | - [x] Logistic Regression 18 | - [x] Regularized Logistic Regression 19 | - [x] Week 4 - Multi-Class Classification and Neural Networks
20 | - [x] Multi-class Classification 21 | - [x] Neural Networks 22 | - [x] Trying Different Parameters 23 | - [x] Week 5 - Neural Networks Learning 24 | - [x] Neural Networks 25 | - [x] Backpropagation [#3](https://github.com/Nikronic/Coursera-Machine-Learning/issues/3) 26 | - [x] Trying Different Parameters 27 | - [ ] Week 6 - Regularized Linear Regression and Bias v.s. Variance 28 | - [x] Regularized Linear Regression 29 | - [ ] Bias-Variance 30 | - [ ] Polynomial Regression 31 | 32 | # Reference 33 | Coursera Machine Learning course by Andrew Ng. 34 | -------------------------------------------------------------------------------- /Week 2 - Linear Regression/ex1data1.csv: -------------------------------------------------------------------------------- 1 | 6.1101,17.592 2 | 5.5277,9.1302 3 | 8.5186,13.662 4 | 7.0032,11.854 5 | 5.8598,6.8233 6 | 8.3829,11.886 7 | 7.4764,4.3483 8 | 8.5781,12 9 | 6.4862,6.5987 10 | 5.0546,3.8166 11 | 5.7107,3.2522 12 | 14.164,15.505 13 | 5.734,3.1551 14 | 8.4084,7.2258 15 | 5.6407,0.71618 16 | 5.3794,3.5129 17 | 6.3654,5.3048 18 | 5.1301,0.56077 19 | 6.4296,3.6518 20 | 7.0708,5.3893 21 | 6.1891,3.1386 22 | 20.27,21.767 23 | 5.4901,4.263 24 | 6.3261,5.1875 25 | 5.5649,3.0825 26 | 18.945,22.638 27 | 12.828,13.501 28 | 10.957,7.0467 29 | 13.176,14.692 30 | 22.203,24.147 31 | 5.2524,-1.22 32 | 6.5894,5.9966 33 | 9.2482,12.134 34 | 5.8918,1.8495 35 | 8.2111,6.5426 36 | 7.9334,4.5623 37 | 8.0959,4.1164 38 | 5.6063,3.3928 39 | 12.836,10.117 40 | 6.3534,5.4974 41 | 5.4069,0.55657 42 | 6.8825,3.9115 43 | 11.708,5.3854 44 | 5.7737,2.4406 45 | 7.8247,6.7318 46 | 7.0931,1.0463 47 | 5.0702,5.1337 48 | 5.8014,1.844 49 | 11.7,8.0043 50 | 5.5416,1.0179 51 | 7.5402,6.7504 52 | 5.3077,1.8396 53 | 7.4239,4.2885 54 | 7.6031,4.9981 55 | 6.3328,1.4233 56 | 6.3589,-1.4211 57 | 6.2742,2.4756 58 | 5.6397,4.6042 59 | 9.3102,3.9624 60 | 9.4536,5.4141 61 | 8.8254,5.1694 62 | 5.1793,-0.74279 63 | 21.279,17.929 64 | 14.908,12.054 65 | 18.959,17.054 66 | 
7.2182,4.8852 67 | 8.2951,5.7442 68 | 10.236,7.7754 69 | 5.4994,1.0173 70 | 20.341,20.992 71 | 10.136,6.6799 72 | 7.3345,4.0259 73 | 6.0062,1.2784 74 | 7.2259,3.3411 75 | 5.0269,-2.6807 76 | 6.5479,0.29678 77 | 7.5386,3.8845 78 | 5.0365,5.7014 79 | 10.274,6.7526 80 | 5.1077,2.0576 81 | 5.7292,0.47953 82 | 5.1884,0.20421 83 | 6.3557,0.67861 84 | 9.7687,7.5435 85 | 6.5159,5.3436 86 | 8.5172,4.2415 87 | 9.1802,6.7981 88 | 6.002,0.92695 89 | 5.5204,0.152 90 | 5.0594,2.8214 91 | 5.7077,1.8451 92 | 7.6366,4.2959 93 | 5.8707,7.2029 94 | 5.3054,1.9869 95 | 8.2934,0.14454 96 | 13.394,9.0551 97 | 5.4369,0.61705 98 | -------------------------------------------------------------------------------- /Week 2 - Linear Regression/ex1data2.csv: -------------------------------------------------------------------------------- 1 | 2104,3,399900 2 | 1600,3,329900 3 | 2400,3,369000 4 | 1416,2,232000 5 | 3000,4,539900 6 | 1985,4,299900 7 | 1534,3,314900 8 | 1427,3,198999 9 | 1380,3,212000 10 | 1494,3,242500 11 | 1940,4,239999 12 | 2000,3,347000 13 | 1890,3,329999 14 | 4478,5,699900 15 | 1268,3,259900 16 | 2300,4,449900 17 | 1320,2,299900 18 | 1236,3,199900 19 | 2609,4,499998 20 | 3031,4,599000 21 | 1767,3,252900 22 | 1888,2,255000 23 | 1604,3,242900 24 | 1962,4,259900 25 | 3890,3,573900 26 | 1100,3,249900 27 | 1458,3,464500 28 | 2526,3,469000 29 | 2200,3,475000 30 | 2637,3,299900 31 | 1839,2,349900 32 | 1000,1,169900 33 | 2040,4,314900 34 | 3137,3,579900 35 | 1811,4,285900 36 | 1437,3,249900 37 | 1239,3,229900 38 | 2132,4,345000 39 | 4215,4,549000 40 | 2162,4,287000 41 | 1664,2,368500 42 | 2238,3,329900 43 | 2567,4,314000 44 | 1200,3,299000 45 | 852,2,179900 46 | 1852,4,299900 47 | 1203,3,239500 48 | -------------------------------------------------------------------------------- /Week 2 - Linear Regression/img/alpha_cost.JPG: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 2 - Linear Regression/img/alpha_cost.JPG -------------------------------------------------------------------------------- /Week 2 - Linear Regression/img/h.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 2 - Linear Regression/img/h.JPG -------------------------------------------------------------------------------- /Week 2 - Linear Regression/img/j.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 2 - Linear Regression/img/j.JPG -------------------------------------------------------------------------------- /Week 2 - Linear Regression/img/jmult.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 2 - Linear Regression/img/jmult.JPG -------------------------------------------------------------------------------- /Week 2 - Linear Regression/img/jmult_p.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 2 - Linear Regression/img/jmult_p.JPG -------------------------------------------------------------------------------- /Week 2 - Linear Regression/img/normal.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 2 - Linear Regression/img/normal.JPG 
-------------------------------------------------------------------------------- /Week 2 - Linear Regression/img/thta.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 2 - Linear Regression/img/thta.JPG -------------------------------------------------------------------------------- /Week 3 - Logistic Regression/ex2data1.csv: -------------------------------------------------------------------------------- 1 | 34.62365962451697,78.0246928153624,0 2 | 30.28671076822607,43.89499752400101,0 3 | 35.84740876993872,72.90219802708364,0 4 | 60.18259938620976,86.30855209546826,1 5 | 79.0327360507101,75.3443764369103,1 6 | 45.08327747668339,56.3163717815305,0 7 | 61.10666453684766,96.51142588489624,1 8 | 75.02474556738889,46.55401354116538,1 9 | 76.09878670226257,87.42056971926803,1 10 | 84.43281996120035,43.53339331072109,1 11 | 95.86155507093572,38.22527805795094,0 12 | 75.01365838958247,30.60326323428011,0 13 | 82.30705337399482,76.48196330235604,1 14 | 69.36458875970939,97.71869196188608,1 15 | 39.53833914367223,76.03681085115882,0 16 | 53.9710521485623,89.20735013750205,1 17 | 69.07014406283025,52.74046973016765,1 18 | 67.94685547711617,46.67857410673128,0 19 | 70.66150955499435,92.92713789364831,1 20 | 76.97878372747498,47.57596364975532,1 21 | 67.37202754570876,42.83843832029179,0 22 | 89.67677575072079,65.79936592745237,1 23 | 50.534788289883,48.85581152764205,0 24 | 34.21206097786789,44.20952859866288,0 25 | 77.9240914545704,68.9723599933059,1 26 | 62.27101367004632,69.95445795447587,1 27 | 80.1901807509566,44.82162893218353,1 28 | 93.114388797442,38.80067033713209,0 29 | 61.83020602312595,50.25610789244621,0 30 | 38.78580379679423,64.99568095539578,0 31 | 61.379289447425,72.80788731317097,1 32 | 85.40451939411645,57.05198397627122,1 33 | 52.10797973193984,63.12762376881715,0 34 | 52.04540476831827,69.43286012045222,1 
35 | 40.23689373545111,71.16774802184875,0 36 | 54.63510555424817,52.21388588061123,0 37 | 33.91550010906887,98.86943574220611,0 38 | 64.17698887494485,80.90806058670817,1 39 | 74.78925295941542,41.57341522824434,0 40 | 34.1836400264419,75.2377203360134,0 41 | 83.90239366249155,56.30804621605327,1 42 | 51.54772026906181,46.85629026349976,0 43 | 94.44336776917852,65.56892160559052,1 44 | 82.36875375713919,40.61825515970618,0 45 | 51.04775177128865,45.82270145776001,0 46 | 62.22267576120188,52.06099194836679,0 47 | 77.19303492601364,70.45820000180959,1 48 | 97.77159928000232,86.7278223300282,1 49 | 62.07306379667647,96.76882412413983,1 50 | 91.56497449807442,88.69629254546599,1 51 | 79.94481794066932,74.16311935043758,1 52 | 99.2725269292572,60.99903099844988,1 53 | 90.54671411399852,43.39060180650027,1 54 | 34.52451385320009,60.39634245837173,0 55 | 50.2864961189907,49.80453881323059,0 56 | 49.58667721632031,59.80895099453265,0 57 | 97.64563396007767,68.86157272420604,1 58 | 32.57720016809309,95.59854761387875,0 59 | 74.24869136721598,69.82457122657193,1 60 | 71.79646205863379,78.45356224515052,1 61 | 75.3956114656803,85.75993667331619,1 62 | 35.28611281526193,47.02051394723416,0 63 | 56.25381749711624,39.26147251058019,0 64 | 30.05882244669796,49.59297386723685,0 65 | 44.66826172480893,66.45008614558913,0 66 | 66.56089447242954,41.09209807936973,0 67 | 40.45755098375164,97.53518548909936,1 68 | 49.07256321908844,51.88321182073966,0 69 | 80.27957401466998,92.11606081344084,1 70 | 66.74671856944039,60.99139402740988,1 71 | 32.72283304060323,43.30717306430063,0 72 | 64.0393204150601,78.03168802018232,1 73 | 72.34649422579923,96.22759296761404,1 74 | 60.45788573918959,73.09499809758037,1 75 | 58.84095621726802,75.85844831279042,1 76 | 99.82785779692128,72.36925193383885,1 77 | 47.26426910848174,88.47586499559782,1 78 | 50.45815980285988,75.80985952982456,1 79 | 60.45555629271532,42.50840943572217,0 80 | 82.22666157785568,42.71987853716458,0 81 | 
88.9138964166533,69.80378889835472,1 82 | 94.83450672430196,45.69430680250754,1 83 | 67.31925746917527,66.58935317747915,1 84 | 57.23870631569862,59.51428198012956,1 85 | 80.36675600171273,90.96014789746954,1 86 | 68.46852178591112,85.59430710452014,1 87 | 42.0754545384731,78.84478600148043,0 88 | 75.47770200533905,90.42453899753964,1 89 | 78.63542434898018,96.64742716885644,1 90 | 52.34800398794107,60.76950525602592,0 91 | 94.09433112516793,77.15910509073893,1 92 | 90.44855097096364,87.50879176484702,1 93 | 55.48216114069585,35.57070347228866,0 94 | 74.49269241843041,84.84513684930135,1 95 | 89.84580670720979,45.35828361091658,1 96 | 83.48916274498238,48.38028579728175,1 97 | 42.2617008099817,87.10385094025457,1 98 | 99.31500880510394,68.77540947206617,1 99 | 55.34001756003703,64.9319380069486,1 100 | 74.77589300092767,89.52981289513276,1 -------------------------------------------------------------------------------- /Week 3 - Logistic Regression/ex2data2.csv: -------------------------------------------------------------------------------- 1 | 0.051267,0.69956,1 2 | -0.092742,0.68494,1 3 | -0.21371,0.69225,1 4 | -0.375,0.50219,1 5 | -0.51325,0.46564,1 6 | -0.52477,0.2098,1 7 | -0.39804,0.034357,1 8 | -0.30588,-0.19225,1 9 | 0.016705,-0.40424,1 10 | 0.13191,-0.51389,1 11 | 0.38537,-0.56506,1 12 | 0.52938,-0.5212,1 13 | 0.63882,-0.24342,1 14 | 0.73675,-0.18494,1 15 | 0.54666,0.48757,1 16 | 0.322,0.5826,1 17 | 0.16647,0.53874,1 18 | -0.046659,0.81652,1 19 | -0.17339,0.69956,1 20 | -0.47869,0.63377,1 21 | -0.60541,0.59722,1 22 | -0.62846,0.33406,1 23 | -0.59389,0.005117,1 24 | -0.42108,-0.27266,1 25 | -0.11578,-0.39693,1 26 | 0.20104,-0.60161,1 27 | 0.46601,-0.53582,1 28 | 0.67339,-0.53582,1 29 | -0.13882,0.54605,1 30 | -0.29435,0.77997,1 31 | -0.26555,0.96272,1 32 | -0.16187,0.8019,1 33 | -0.17339,0.64839,1 34 | -0.28283,0.47295,1 35 | -0.36348,0.31213,1 36 | -0.30012,0.027047,1 37 | -0.23675,-0.21418,1 38 | -0.06394,-0.18494,1 39 | 0.062788,-0.16301,1 40 | 
0.22984,-0.41155,1 41 | 0.2932,-0.2288,1 42 | 0.48329,-0.18494,1 43 | 0.64459,-0.14108,1 44 | 0.46025,0.012427,1 45 | 0.6273,0.15863,1 46 | 0.57546,0.26827,1 47 | 0.72523,0.44371,1 48 | 0.22408,0.52412,1 49 | 0.44297,0.67032,1 50 | 0.322,0.69225,1 51 | 0.13767,0.57529,1 52 | -0.0063364,0.39985,1 53 | -0.092742,0.55336,1 54 | -0.20795,0.35599,1 55 | -0.20795,0.17325,1 56 | -0.43836,0.21711,1 57 | -0.21947,-0.016813,1 58 | -0.13882,-0.27266,1 59 | 0.18376,0.93348,0 60 | 0.22408,0.77997,0 61 | 0.29896,0.61915,0 62 | 0.50634,0.75804,0 63 | 0.61578,0.7288,0 64 | 0.60426,0.59722,0 65 | 0.76555,0.50219,0 66 | 0.92684,0.3633,0 67 | 0.82316,0.27558,0 68 | 0.96141,0.085526,0 69 | 0.93836,0.012427,0 70 | 0.86348,-0.082602,0 71 | 0.89804,-0.20687,0 72 | 0.85196,-0.36769,0 73 | 0.82892,-0.5212,0 74 | 0.79435,-0.55775,0 75 | 0.59274,-0.7405,0 76 | 0.51786,-0.5943,0 77 | 0.46601,-0.41886,0 78 | 0.35081,-0.57968,0 79 | 0.28744,-0.76974,0 80 | 0.085829,-0.75512,0 81 | 0.14919,-0.57968,0 82 | -0.13306,-0.4481,0 83 | -0.40956,-0.41155,0 84 | -0.39228,-0.25804,0 85 | -0.74366,-0.25804,0 86 | -0.69758,0.041667,0 87 | -0.75518,0.2902,0 88 | -0.69758,0.68494,0 89 | -0.4038,0.70687,0 90 | -0.38076,0.91886,0 91 | -0.50749,0.90424,0 92 | -0.54781,0.70687,0 93 | 0.10311,0.77997,0 94 | 0.057028,0.91886,0 95 | -0.10426,0.99196,0 96 | -0.081221,1.1089,0 97 | 0.28744,1.087,0 98 | 0.39689,0.82383,0 99 | 0.63882,0.88962,0 100 | 0.82316,0.66301,0 101 | 0.67339,0.64108,0 102 | 1.0709,0.10015,0 103 | -0.046659,-0.57968,0 104 | -0.23675,-0.63816,0 105 | -0.15035,-0.36769,0 106 | -0.49021,-0.3019,0 107 | -0.46717,-0.13377,0 108 | -0.28859,-0.060673,0 109 | -0.61118,-0.067982,0 110 | -0.66302,-0.21418,0 111 | -0.59965,-0.41886,0 112 | -0.72638,-0.082602,0 113 | -0.83007,0.31213,0 114 | -0.72062,0.53874,0 115 | -0.59389,0.49488,0 116 | -0.48445,0.99927,0 117 | -0.0063364,0.99927,0 118 | 0.63265,-0.030612,0 -------------------------------------------------------------------------------- /Week 3 - Logistic 
Regression/img/fit.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 3 - Logistic Regression/img/fit.JPG -------------------------------------------------------------------------------- /Week 3 - Logistic Regression/img/gradient.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 3 - Logistic Regression/img/gradient.JPG -------------------------------------------------------------------------------- /Week 3 - Logistic Regression/img/gradient_reg.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 3 - Logistic Regression/img/gradient_reg.JPG -------------------------------------------------------------------------------- /Week 3 - Logistic Regression/img/gradient_reg_.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 3 - Logistic Regression/img/gradient_reg_.JPG -------------------------------------------------------------------------------- /Week 3 - Logistic Regression/img/j.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 3 - Logistic Regression/img/j.JPG -------------------------------------------------------------------------------- /Week 3 - Logistic Regression/img/j_reg.JPG: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 3 - Logistic Regression/img/j_reg.JPG -------------------------------------------------------------------------------- /Week 3 - Logistic Regression/img/lr-h.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 3 - Logistic Regression/img/lr-h.JPG -------------------------------------------------------------------------------- /Week 3 - Logistic Regression/img/map_feature.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 3 - Logistic Regression/img/map_feature.JPG -------------------------------------------------------------------------------- /Week 3 - Logistic Regression/img/sigmoid.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 3 - Logistic Regression/img/sigmoid.JPG -------------------------------------------------------------------------------- /Week 4 - Multi-Class Classification and Neural Networks/Neural Networks.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "cells": [ 3 | { 4 | "cell_type": "markdown", 5 | "metadata": {}, 6 | "source": [ 7 | "# Neural Networks\n", 8 | "In the previous part of this exercise, you implemented multi-class logistic re gression to recognize handwritten digits. However, logistic regression cannot form more complex hypotheses as it is only a linear classifier.

\n", 9 | "\n", 10 | "In this part of the exercise, you will implement a neural network to recognize handwritten digits using the same training set as before. The neural network will be able to represent complex models that form non-linear hypotheses. For this week, you will be using parameters from a neural network that we have already trained. Your goal is to implement the feedforward propagation algorithm to use our weights for prediction. In next week’s exercise, you will write the backpropagation algorithm for learning the neural network parameters.

\n", 11 | "\n", 12 | "The file ex3data1 contains a training set.
\n", 13 | "The structure of the dataset is described below:
\n", 14 | "1. X array = 400 columns describe the values of pixels of 20*20 images in flatten format for 5000 samples\n", 15 | "2. y array = Value of image (number between 0-9)\n", 16 | "\n", 17 | "\n", 18 | "

\n", 19 | "\n", 20 | "Our assignment has these sections:\n", 21 | "1. Visualizing the Data\n", 22 | " 1. Converting .mat to .csv\n", 23 | " 2. Loading Dataset and Trained Neural Network Weights\n", 24 | " 3. Ploting Data\n", 25 | "2. Model Representation\n", 26 | "3. Feedforward Propagation and Prediction\n", 27 | "\n", 28 | "\n", 29 | "In each section full description provided." 30 | ] 31 | }, 32 | { 33 | "cell_type": "markdown", 34 | "metadata": {}, 35 | "source": [ 36 | "## 1. Visualizing the Dataset\n", 37 | "Before starting on any task, it is often useful to understand the data by visualizing it.
" 38 | ] 39 | }, 40 | { 41 | "cell_type": "markdown", 42 | "metadata": {}, 43 | "source": [ 44 | "### 1.A Converting .mat to .csv\n", 45 | "In this specific assignment, the instructor added a .mat file as training set and weights of trained neural network. But we have to convert it to .csv to use in python.
\n", 46 | "After all we now ready to import our new csv files to pandas dataframes and do preprocessing on it and make it ready for next steps." 47 | ] 48 | }, 49 | { 50 | "cell_type": "code", 51 | "execution_count": 2, 52 | "metadata": {}, 53 | "outputs": [], 54 | "source": [ 55 | "# import libraries\n", 56 | "import scipy.io\n", 57 | "import numpy as np\n", 58 | "\n", 59 | "data = scipy.io.loadmat(\"ex3data1\")\n", 60 | "weights = scipy.io.loadmat('ex3weights')" 61 | ] 62 | }, 63 | { 64 | "cell_type": "markdown", 65 | "metadata": {}, 66 | "source": [ 67 | "Now we extract X and y variables from the .mat file and save them into .csv file for further usage. After running the below code you should see X.csv and y.csv files in your directory." 68 | ] 69 | }, 70 | { 71 | "cell_type": "code", 72 | "execution_count": 3, 73 | "metadata": {}, 74 | "outputs": [], 75 | "source": [ 76 | "for i in data:\n", 77 | " if '__' not in i and 'readme' not in i:\n", 78 | " np.savetxt((i+\".csv\"),data[i],delimiter=',')\n", 79 | " \n", 80 | "for i in weights:\n", 81 | " if '__' not in i and 'readme' not in i:\n", 82 | " np.savetxt((i+\".csv\"),weights[i],delimiter=',')" 83 | ] 84 | }, 85 | { 86 | "cell_type": "markdown", 87 | "metadata": {}, 88 | "source": [ 89 | "### 1.B Loading Dataset and Trained Neural Network Weights\n", 90 | "First we import .csv files into pandas dataframes then save them into numpy arrays.

\n", 91 | "There are 5000 training examples in ex3data1.mat, where each training example is a 20 pixel by 20 pixel grayscale image of the digit. Each pixel is represented by a floating point number indicating the grayscale intensity at that location. The 20 by 20 grid of pixels is \"flattened\" into a 400-dimensional vector. Each of these training examples becomes a single row in our data matrix X. This gives us a 5000 by 400 matrix X where every row is a training example for a handwritten digit image.

\n", 92 | "The second part of the training set is a 5000-dimensional vector y that contains labels for the training set.

\n", 93 | "Notice: In the dataset, the digit zero is mapped to the value ten. Therefore, a \"0\" digit is labeled as \"10\", while the digits \"1\" to \"9\" are labeled as \"1\" to \"9\" in their natural order.
\n", 94 | "But this make thing harder so we bring it back to natural order for 0!" 95 | ] 96 | }, 97 | { 98 | "cell_type": "code", 99 | "execution_count": 4, 100 | "metadata": {}, 101 | "outputs": [], 102 | "source": [ 103 | "# import library\n", 104 | "import pandas as pd\n", 105 | "\n", 106 | "# saving .csv files to pandas dataframes\n", 107 | "x_df = pd.read_csv('X.csv',names= np.arange(0,400))\n", 108 | "y_df = pd.read_csv('y.csv',names=['label'])" 109 | ] 110 | }, 111 | { 112 | "cell_type": "code", 113 | "execution_count": 5, 114 | "metadata": {}, 115 | "outputs": [], 116 | "source": [ 117 | "# saving .csv files to pandas dataframes\n", 118 | "Theta1_df = pd.read_csv('Theta1.csv',names = np.arange(0,401))\n", 119 | "Theta2_df = pd.read_csv('Theta2.csv',names = np.arange(0,26))" 120 | ] 121 | }, 122 | { 123 | "cell_type": "code", 124 | "execution_count": 6, 125 | "metadata": {}, 126 | "outputs": [ 127 | { 128 | "name": "stdout", 129 | "output_type": "stream", 130 | "text": [ 131 | "#5000 Number of training samples, #400 features per sample\n" 132 | ] 133 | } 134 | ], 135 | "source": [ 136 | "# saving x_df and y_df into numpy arrays\n", 137 | "x = x_df.iloc[:,:].values\n", 138 | "y = y_df.iloc[:,:].values\n", 139 | "\n", 140 | "m, n = x.shape\n", 141 | "\n", 142 | "# bring back 0 to 0 !!!\n", 143 | "y = y.reshape(m,)\n", 144 | "y[y==10] = 0\n", 145 | "y = y.reshape(m,1)\n", 146 | "\n", 147 | "print('#{} Number of training samples, #{} features per sample'.format(m,n))" 148 | ] 149 | }, 150 | { 151 | "cell_type": "code", 152 | "execution_count": 7, 153 | "metadata": {}, 154 | "outputs": [], 155 | "source": [ 156 | "# saving Theta1_df and Theta2_df into numpy arrays\n", 157 | "theta1 = Theta1_df.iloc[:,:].values\n", 158 | "theta2 = Theta2_df.iloc[:,:].values" 159 | ] 160 | }, 161 | { 162 | "cell_type": "markdown", 163 | "metadata": {}, 164 | "source": [ 165 | "### 1.C Plotting Data\n", 166 | "You will begin by visualizing a subset of the training set. 
In the first part, the code randomly selects 100 rows from X and passes those rows to the display_data function. This function maps each row to a 20 pixel by 20 pixel grayscale image and displays the images together.
\n", 167 | "After plotting, you should see an image like this:" 168 | ] 169 | }, 170 | { 171 | "cell_type": "code", 172 | "execution_count": 8, 173 | "metadata": {}, 174 | "outputs": [ 175 | { 176 | "data": { 177 | "text/plain": [ 178 | "
" 179 | ] 180 | }, 181 | "metadata": {}, 182 | "output_type": "display_data" 183 | }, 184 | { 185 | "name": "stdout", 186 | "output_type": "stream", 187 | "text": [ 188 | "[ 5. 0. 3. 1. 4. 2. 3. 3. 6. 5. 3. 0. 1. 2. 4. 1. 9. 0.\n", 189 | " 6. 5. 4. 2. 2. 4. 4. 7. 6. 7. 4. 5. 6. 5. 2. 4. 5. 9.\n", 190 | " 3. 2. 8. 4. 1. 4. 0. 0. 8. 5. 7. 4. 6. 4. 1. 8. 9. 7.\n", 191 | " 0. 1. 2. 9. 5. 8. 2. 7. 5. 5. 8. 7. 6. 6. 8. 4. 3. 4.\n", 192 | " 9. 2. 1. 1. 3. 3. 7. 0. 8. 6. 2. 3. 8. 1. 6. 1. 9. 0.\n", 193 | " 1. 6. 6. 5. 0. 8. 5. 6. 4. 7.]\n" 194 | ] 195 | } 196 | ], 197 | "source": [ 198 | "import numpy as np\n", 199 | "import matplotlib.pyplot as plt\n", 200 | "import random\n", 201 | "\n", 202 | "amount = 100\n", 203 | "lines = 10\n", 204 | "columns = 10\n", 205 | "image = np.zeros((amount, 20, 20))\n", 206 | "number = np.zeros(amount)\n", 207 | "\n", 208 | "for i in range(amount):\n", 209 | " rnd = random.randint(0,4999)\n", 210 | " image[i] = x[rnd].reshape(20, 20)\n", 211 | " y_temp = y.reshape(m,)\n", 212 | " number[i] = y_temp[rnd]\n", 213 | "fig = plt.figure(figsize=(8,8))\n", 214 | "\n", 215 | "for i in range(amount):\n", 216 | " ax = fig.add_subplot(lines, columns, 1 + i)\n", 217 | " \n", 218 | " # Turn off tick labels\n", 219 | " ax.set_yticklabels([])\n", 220 | " ax.set_xticklabels([])\n", 221 | " plt.imshow(image[i], cmap='binary')\n", 222 | "plt.show()\n", 223 | "print(number)" 224 | ] 225 | }, 226 | { 227 | "cell_type": "markdown", 228 | "metadata": {}, 229 | "source": [ 230 | "# 2. Model Representation\n", 231 | "Our neural network is shown in below figure. It has 3 layers an input layer, a hidden layer and an output layer. Recall that our inputs are pixel values of digit images. Since the images are of size 20×20, this gives us 400 input layer units (excluding the extra bias unit which always outputs +1).


\n", 232 | "You have been provided with a set of network parameters (Θ(1); Θ(2)) already trained by instructor.

\n", 233 | "The parameters Theta1 and Theta2 have dimensions that are sized for a neural network with 25 units in the second layer and 10 output units (corresponding to the 10 digit classes)." 234 | ] 235 | }, 236 | { 237 | "cell_type": "code", 238 | "execution_count": 9, 239 | "metadata": {}, 240 | "outputs": [ 241 | { 242 | "name": "stdout", 243 | "output_type": "stream", 244 | "text": [ 245 | "theta1 shape = (25, 401), theta2 shape = (10, 26)\n" 246 | ] 247 | } 248 | ], 249 | "source": [ 250 | "print('theta1 shape = {}, theta2 shape = {}'.format(theta1.shape,theta2.shape))" 251 | ] 252 | }, 253 | { 254 | "cell_type": "markdown", 255 | "metadata": {}, 256 | "source": [ 257 | "It seems our weights are transposed, so we transpose them back to match the layout our neural network uses." 258 | ] 259 | }, 260 | { 261 | "cell_type": "code", 262 | "execution_count": 10, 263 | "metadata": {}, 264 | "outputs": [ 265 | { 266 | "name": "stdout", 267 | "output_type": "stream", 268 | "text": [ 269 | "theta1 shape = (401, 25), theta2 shape = (26, 10)\n" 270 | ] 271 | } 272 | ], 273 | "source": [ 274 | "theta1 = theta1.transpose()\n", 275 | "theta2 = theta2.transpose()\n", 276 | "print('theta1 shape = {}, theta2 shape = {}'.format(theta1.shape,theta2.shape))" 277 | ] 278 | }, 279 | { 280 | "cell_type": "markdown", 281 | "metadata": {}, 282 | "source": [ 283 | "# 3. Feedforward Propagation and Prediction\n", 284 | "Now you will implement feedforward propagation for the neural network.
\n", 285 | "You should implement the feedforward computation that computes $h_\\theta(x^{(i)})$ for every example i and returns the associated predictions. Similar to the one-vs-all classification strategy, the prediction from the neural network will be the label that has the largest output $(h_\\theta(x))_k$." 286 | ] 287 | }, 288 | { 289 | "cell_type": "markdown", 290 | "metadata": {}, 291 | "source": [ 292 | "Implementation Note: The matrix X contains the examples in rows. When you complete the code, you will need to add the column of 1’s to the matrix. The matrices Theta1 and Theta2 contain the parameters for each unit in rows. Specifically, the first row of Theta1 corresponds to the first hidden unit in the second layer.
\n", 293 | "You must get a(l) as a column vector.

\n", 294 | "You should see that the accuracy is about 97.5%." 295 | ] 296 | }, 297 | { 298 | "cell_type": "code", 299 | "execution_count": 11, 300 | "metadata": {}, 301 | "outputs": [], 302 | "source": [ 303 | "# adding column of 1's to x\n", 304 | "x = np.append(np.ones(shape=(m,1)),x,axis = 1)" 305 | ] 306 | }, 307 | { 308 | "cell_type": "markdown", 309 | "metadata": {}, 310 | "source": [ 311 | "h = hypothesis(x,theta) will compute sigmoid function on θTX and return a number which 0<=h<=1.
\n", 312 | "You can use this library for calculating sigmoid." 313 | ] 314 | }, 315 | { 316 | "cell_type": "code", 317 | "execution_count": 12, 318 | "metadata": {}, 319 | "outputs": [], 320 | "source": [ 321 | "def sigmoid(z):\n", 322 | " return 1/(1+np.exp(-z))" 323 | ] 324 | }, 325 | { 326 | "cell_type": "code", 327 | "execution_count": 13, 328 | "metadata": {}, 329 | "outputs": [], 330 | "source": [ 331 | "def lr_hypothesis(x,theta):\n", 332 | " return np.dot(x,theta)" 333 | ] 334 | }, 335 | { 336 | "cell_type": "markdown", 337 | "metadata": {}, 338 | "source": [ 339 | "predict(theta1, theta2, x): outputs the predicted label of x given the trained weights of a neural network (theta1, theta2)." 340 | ] 341 | }, 342 | { 343 | "cell_type": "code", 344 | "execution_count": 14, 345 | "metadata": {}, 346 | "outputs": [], 347 | "source": [ 348 | "layers = 3\n", 349 | "num_labels = 10" 350 | ] 351 | }, 352 | { 353 | "cell_type": "markdown", 354 | "metadata": {}, 355 | "source": [ 356 | "Becuase the initial dataset has changed and mapped 0 to \"10\", so the weights also are changed. So we just rotate columns one step to right, to predict correct values.
\n", 357 | "Recall that we changed the label mapping so that the digit 0 is stored as \"0\" instead of \"10\", but this change is not reflected in the weights of the neural network. So we have to apply this rotation to the final output of probabilities.
" 358 | ] 359 | }, 360 | { 361 | "cell_type": "code", 362 | "execution_count": 34, 363 | "metadata": {}, 364 | "outputs": [], 365 | "source": [ 366 | "def rotate_column(array):\n", 367 | " array_ = np.zeros(shape=(m,num_labels))\n", 368 | " temp = np.zeros(num_labels,)\n", 369 | " temp= array[:,9]\n", 370 | " array_[:,1:10] = array[:,0:9]\n", 371 | " array_[:,0] = temp\n", 372 | " return array_" 373 | ] 374 | }, 375 | { 376 | "cell_type": "code", 377 | "execution_count": 35, 378 | "metadata": {}, 379 | "outputs": [], 380 | "source": [ 381 | "def predict(theta1,theta2,x):\n", 382 | " z2 = np.dot(x,theta1) # hidden layer\n", 383 | " a2 = sigmoid(z2) # hidden layer\n", 384 | "\n", 385 | " # adding column of 1's to a2\n", 386 | " a2 = np.append(np.ones(shape=(m,1)),a2,axis = 1)\n", 387 | " z3 = np.dot(a2,theta2)\n", 388 | " a3 = sigmoid(z3)\n", 389 | " \n", 390 | " # mapping problem. Rotate left one step\n", 391 | " y_prob = rotate_column(a3)\n", 392 | " \n", 393 | " # prediction on activation a2\n", 394 | " y_pred = np.argmax(y_prob, axis=1).reshape(-1,1)\n", 395 | " return y_pred" 396 | ] 397 | }, 398 | { 399 | "cell_type": "code", 400 | "execution_count": 36, 401 | "metadata": {}, 402 | "outputs": [ 403 | { 404 | "data": { 405 | "text/plain": [ 406 | "(5000, 1)" 407 | ] 408 | }, 409 | "execution_count": 36, 410 | "metadata": {}, 411 | "output_type": "execute_result" 412 | } 413 | ], 414 | "source": [ 415 | "y_pred = predict(theta1,theta2,x)\n", 416 | "y_pred.shape" 417 | ] 418 | }, 419 | { 420 | "cell_type": "markdown", 421 | "metadata": {}, 422 | "source": [ 423 | "Now we will compare our predicted result to the true one with confusion_matrix of numpy library." 
424 | ] 425 | }, 426 | { 427 | "cell_type": "code", 428 | "execution_count": 37, 429 | "metadata": {}, 430 | "outputs": [], 431 | "source": [ 432 | "from sklearn.metrics import confusion_matrix\n", 433 | "\n", 434 | "# Function for accuracy\n", 435 | "def acc(confusion_matrix):\n", 436 | " t = 0\n", 437 | " for i in range(num_labels):\n", 438 | " t += confusion_matrix[i][i]\n", 439 | " f = m-t\n", 440 | " ac = t/(m)\n", 441 | " return (t,f,ac)" 442 | ] 443 | }, 444 | { 445 | "cell_type": "code", 446 | "execution_count": 38, 447 | "metadata": {}, 448 | "outputs": [ 449 | { 450 | "name": "stdout", 451 | "output_type": "stream", 452 | "text": [ 453 | "With #4876 correct, #124 wrong ==========> accuracy = 97.52%\n" 454 | ] 455 | } 456 | ], 457 | "source": [ 458 | "#import library\n", 459 | "from sklearn.metrics import confusion_matrix\n", 460 | "cm_train = confusion_matrix(y.reshape(m,),y_pred.reshape(m,))\n", 461 | "t,f,ac = acc(cm_train)\n", 462 | "print('With #{} correct, #{} wrong ==========> accuracy = {}%'\n", 463 | " .format(t,f,ac*100))" 464 | ] 465 | }, 466 | { 467 | "cell_type": "code", 468 | "execution_count": 39, 469 | "metadata": {}, 470 | "outputs": [ 471 | { 472 | "data": { 473 | "text/plain": [ 474 | "array([[496, 0, 0, 0, 1, 0, 1, 0, 1, 1],\n", 475 | " [ 0, 491, 1, 1, 2, 0, 0, 1, 3, 1],\n", 476 | " [ 3, 1, 485, 0, 3, 1, 3, 1, 2, 1],\n", 477 | " [ 0, 2, 2, 480, 0, 8, 1, 4, 1, 2],\n", 478 | " [ 0, 2, 2, 0, 484, 0, 3, 0, 1, 8],\n", 479 | " [ 0, 0, 1, 4, 1, 492, 2, 0, 0, 0],\n", 480 | " [ 2, 2, 0, 0, 0, 3, 493, 0, 0, 0],\n", 481 | " [ 1, 3, 2, 1, 4, 0, 0, 485, 0, 4],\n", 482 | " [ 0, 4, 1, 1, 2, 1, 0, 0, 491, 0],\n", 483 | " [ 3, 2, 0, 4, 2, 1, 1, 5, 3, 479]], dtype=int64)" 484 | ] 485 | }, 486 | "execution_count": 39, 487 | "metadata": {}, 488 | "output_type": "execute_result" 489 | } 490 | ], 491 | "source": [ 492 | "cm_train" 493 | ] 494 | } 495 | ], 496 | "metadata": { 497 | "kernelspec": { 498 | "display_name": "Python 3", 499 | "language": "python", 
500 | "name": "python3" 501 | }, 502 | "language_info": { 503 | "codemirror_mode": { 504 | "name": "ipython", 505 | "version": 3 506 | }, 507 | "file_extension": ".py", 508 | "mimetype": "text/x-python", 509 | "name": "python", 510 | "nbconvert_exporter": "python", 511 | "pygments_lexer": "ipython3", 512 | "version": "3.6.6" 513 | } 514 | }, 515 | "nbformat": 4, 516 | "nbformat_minor": 2 517 | } 518 | -------------------------------------------------------------------------------- /Week 4 - Multi-Class Classification and Neural Networks/ex3data1.mat: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 4 - Multi-Class Classification and Neural Networks/ex3data1.mat -------------------------------------------------------------------------------- /Week 4 - Multi-Class Classification and Neural Networks/ex3weights.mat: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 4 - Multi-Class Classification and Neural Networks/ex3weights.mat -------------------------------------------------------------------------------- /Week 4 - Multi-Class Classification and Neural Networks/img/bx.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 4 - Multi-Class Classification and Neural Networks/img/bx.JPG -------------------------------------------------------------------------------- /Week 4 - Multi-Class Classification and Neural Networks/img/fullgrad.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 4 - 
Multi-Class Classification and Neural Networks/img/fullgrad.JPG -------------------------------------------------------------------------------- /Week 4 - Multi-Class Classification and Neural Networks/img/grad.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 4 - Multi-Class Classification and Neural Networks/img/grad.JPG -------------------------------------------------------------------------------- /Week 4 - Multi-Class Classification and Neural Networks/img/h-y.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 4 - Multi-Class Classification and Neural Networks/img/h-y.JPG -------------------------------------------------------------------------------- /Week 4 - Multi-Class Classification and Neural Networks/img/j.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 4 - Multi-Class Classification and Neural Networks/img/j.JPG -------------------------------------------------------------------------------- /Week 4 - Multi-Class Classification and Neural Networks/img/nn.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 4 - Multi-Class Classification and Neural Networks/img/nn.JPG -------------------------------------------------------------------------------- /Week 4 - Multi-Class Classification and Neural Networks/img/plot.JPG: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 4 - Multi-Class Classification and Neural Networks/img/plot.JPG -------------------------------------------------------------------------------- /Week 4 - Multi-Class Classification and Neural Networks/img/x.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 4 - Multi-Class Classification and Neural Networks/img/x.JPG -------------------------------------------------------------------------------- /Week 4 - Multi-Class Classification and Neural Networks/img/xandtheta.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 4 - Multi-Class Classification and Neural Networks/img/xandtheta.JPG -------------------------------------------------------------------------------- /Week 4 - Multi-Class Classification and Neural Networks/img/xtheta.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 4 - Multi-Class Classification and Neural Networks/img/xtheta.JPG -------------------------------------------------------------------------------- /Week 5 - Neural Networks Learning/ex4data1.mat: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 5 - Neural Networks Learning/ex4data1.mat -------------------------------------------------------------------------------- /Week 5 - Neural Networks Learning/ex4weights.mat: 
-------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 5 - Neural Networks Learning/ex4weights.mat -------------------------------------------------------------------------------- /Week 5 - Neural Networks Learning/img/acc_grad.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 5 - Neural Networks Learning/img/acc_grad.JPG -------------------------------------------------------------------------------- /Week 5 - Neural Networks Learning/img/backprop.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 5 - Neural Networks Learning/img/backprop.JPG -------------------------------------------------------------------------------- /Week 5 - Neural Networks Learning/img/delta.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 5 - Neural Networks Learning/img/delta.JPG -------------------------------------------------------------------------------- /Week 5 - Neural Networks Learning/img/dj.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 5 - Neural Networks Learning/img/dj.JPG -------------------------------------------------------------------------------- /Week 5 - Neural Networks Learning/img/fi.JPG: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 5 - Neural Networks Learning/img/fi.JPG -------------------------------------------------------------------------------- /Week 5 - Neural Networks Learning/img/full_grad.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 5 - Neural Networks Learning/img/full_grad.JPG -------------------------------------------------------------------------------- /Week 5 - Neural Networks Learning/img/g_grad.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 5 - Neural Networks Learning/img/g_grad.JPG -------------------------------------------------------------------------------- /Week 5 - Neural Networks Learning/img/grad_reg.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 5 - Neural Networks Learning/img/grad_reg.JPG -------------------------------------------------------------------------------- /Week 5 - Neural Networks Learning/img/hidden_backprop.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 5 - Neural Networks Learning/img/hidden_backprop.JPG -------------------------------------------------------------------------------- /Week 5 - Neural Networks Learning/img/j_reg.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 5 
- Neural Networks Learning/img/j_reg.JPG -------------------------------------------------------------------------------- /Week 5 - Neural Networks Learning/img/nn.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 5 - Neural Networks Learning/img/nn.JPG -------------------------------------------------------------------------------- /Week 5 - Neural Networks Learning/img/plot.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 5 - Neural Networks Learning/img/plot.JPG -------------------------------------------------------------------------------- /Week 5 - Neural Networks Learning/img/sig.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 5 - Neural Networks Learning/img/sig.JPG -------------------------------------------------------------------------------- /Week 5 - Neural Networks Learning/img/theta_dif.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 5 - Neural Networks Learning/img/theta_dif.JPG -------------------------------------------------------------------------------- /Week 5 - Neural Networks Learning/img/x.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 5 - Neural Networks Learning/img/x.JPG -------------------------------------------------------------------------------- /Week 5 - Neural Networks 
Learning/img/y.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 5 - Neural Networks Learning/img/y.JPG -------------------------------------------------------------------------------- /Week 6 - Regularized Linear Regression and Bias v.s. Variance/Polynomial Regression.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "cells": [ 3 | { 4 | "cell_type": "markdown", 5 | "metadata": {}, 6 | "source": [ 7 | "# Polynomial Regression\n", 8 | "The problem with our linear model was that it was too simple for the data and resulted in underfitting (high bias). In this part of the exercise, you will address this problem by adding more features.

\n", 9 | "\n", 10 | "The file ex5data1 contains a data set which includes train set, test set, validation set.
\n", 11 | "The structure of the dataset is described below:
\n", 12 | "1. x = **Water level (a single feature)**\n", 13 | "2. y = **Value of flowed water**\n", 14 | "3. xval = **x validation set**\n", 15 | "4. yval = **y validation set**\n", 16 | "5. xtest = **x test set**\n", 17 | "6. ytest = **y test set**\n", 18 | "\n", 19 | "\n", 20 | "

\n", 21 | "\n", 22 | "Our assignment has these sections:\n", 23 | "1. Visualizing the Data\n", 24 | " 1. Converting .mat to .csv\n", 25 | " 2. Loading Dataset\n", 26 | " 3. Visualizing The Dataset\n", 27 | "2. Adding Polynomial Features\n", 28 | " 1. Adding Features\n", 29 | " 2. Normalizing Features\n", 30 | "3. Learning Polynomial Regression\n", 31 | " 1. Regularized Linear Regression Cost Function\n", 32 | " 2. Regularized Linear Regression Gradient\n", 33 | " 3. Fitting Linear Regression\n", 34 | " 4. Visualization of Fitted Model\n", 35 | "4. Adjusting The Regularization Parameter\n", 36 | " 1. \n", 37 | "5. Selecting λ Using a Cross Validation Set\n", 38 | " 1. \n", 39 | "6. Computing Test Set Error\n", 40 | " 1. \n", 41 | "7. Plotting Learning Curves With Randomly Selected Examples\n", 42 | " \n", 43 | "\n", 44 | "\n", 45 | "In each section full description provided." 46 | ] 47 | }, 48 | { 49 | "cell_type": "markdown", 50 | "metadata": {}, 51 | "source": [ 52 | "## 1. Visualizing the Dataset\n", 53 | "Before starting on any task, it is often useful to understand the data by visualizing it.
" 54 | ] 55 | }, 56 | { 57 | "cell_type": "markdown", 58 | "metadata": {}, 59 | "source": [ 60 | "### 1.A Converting .mat to .csv\n", 61 | "In this specific assignment, the instructor added a .mat file as training set and weights of trained neural network. But we have to convert it to .csv to use in python.
\n", 62 | "After all we now ready to import our new csv files to pandas dataframes and do preprocessing on it and make it ready for next steps." 63 | ] 64 | }, 65 | { 66 | "cell_type": "code", 67 | "execution_count": 1, 68 | "metadata": {}, 69 | "outputs": [], 70 | "source": [ 71 | "# import libraries\n", 72 | "import scipy.io\n", 73 | "import numpy as np\n", 74 | "\n", 75 | "data = scipy.io.loadmat(\"ex5data1\")" 76 | ] 77 | }, 78 | { 79 | "cell_type": "markdown", 80 | "metadata": {}, 81 | "source": [ 82 | "Now we **extract** `x`, `y`, `xval`, `yval`, `xtest` and `ytest` variables from the .mat file and save them into .csv file for further usage. After running the below code you should see:\n", 83 | "1. X.csv\n", 84 | "2. y.csv \n", 85 | "3. Xtest.csv\n", 86 | "4. ytest.csv\n", 87 | "5. Xval.csv\n", 88 | "6. yval.csv\n", 89 | "\n", 90 | "files in your directory." 91 | ] 92 | }, 93 | { 94 | "cell_type": "code", 95 | "execution_count": 2, 96 | "metadata": {}, 97 | "outputs": [], 98 | "source": [ 99 | "for i in data:\n", 100 | " if '__' not in i and 'readme' not in i:\n", 101 | " np.savetxt((i+\".csv\"),data[i],delimiter=',')" 102 | ] 103 | }, 104 | { 105 | "cell_type": "markdown", 106 | "metadata": {}, 107 | "source": [ 108 | "### 1.B Loading Dataset\n", 109 | "First we import .csv files into pandas dataframes then save them into numpy arrays.

" 110 | ] 111 | }, 112 | { 113 | "cell_type": "code", 114 | "execution_count": 3, 115 | "metadata": {}, 116 | "outputs": [], 117 | "source": [ 118 | "# import library\n", 119 | "import pandas as pd\n", 120 | "\n", 121 | "# saving .csv files to pandas dataframes\n", 122 | "x_df = pd.read_csv('X.csv',names= ['x'])\n", 123 | "xtest_df = pd.read_csv('Xtest.csv',names= ['xtest'])\n", 124 | "xval_df = pd.read_csv('Xval.csv',names= ['xval'])\n", 125 | "y_df = pd.read_csv('y.csv',names=['y'])\n", 126 | "ytest_df = pd.read_csv('ytest.csv',names= ['ytest'])\n", 127 | "yval_df = pd.read_csv('yval.csv',names= ['yval'])" 128 | ] 129 | }, 130 | { 131 | "cell_type": "code", 132 | "execution_count": 4, 133 | "metadata": {}, 134 | "outputs": [ 135 | { 136 | "data": { 137 | "text/html": [ 138 | "
\n", 139 | "\n", 152 | "\n", 153 | " \n", 154 | " \n", 155 | " \n", 156 | " \n", 157 | " \n", 158 | " \n", 159 | " \n", 160 | " \n", 161 | " \n", 162 | " \n", 163 | " \n", 164 | " \n", 165 | " \n", 166 | " \n", 167 | " \n", 168 | " \n", 169 | " \n", 170 | " \n", 171 | " \n", 172 | " \n", 173 | "
x
0-15.936758
1-29.152979
236.189549
\n", 174 | "
" 175 | ], 176 | "text/plain": [ 177 | " x\n", 178 | "0 -15.936758\n", 179 | "1 -29.152979\n", 180 | "2 36.189549" 181 | ] 182 | }, 183 | "execution_count": 4, 184 | "metadata": {}, 185 | "output_type": "execute_result" 186 | } 187 | ], 188 | "source": [ 189 | "x_df.head(3)" 190 | ] 191 | }, 192 | { 193 | "cell_type": "code", 194 | "execution_count": 5, 195 | "metadata": {}, 196 | "outputs": [ 197 | { 198 | "data": { 199 | "text/html": [ 200 | "
\n", 201 | "\n", 214 | "\n", 215 | " \n", 216 | " \n", 217 | " \n", 218 | " \n", 219 | " \n", 220 | " \n", 221 | " \n", 222 | " \n", 223 | " \n", 224 | " \n", 225 | " \n", 226 | " \n", 227 | " \n", 228 | " \n", 229 | " \n", 230 | " \n", 231 | " \n", 232 | " \n", 233 | " \n", 234 | " \n", 235 | "
y
02.134311
11.173257
234.359109
\n", 236 | "
" 237 | ], 238 | "text/plain": [ 239 | " y\n", 240 | "0 2.134311\n", 241 | "1 1.173257\n", 242 | "2 34.359109" 243 | ] 244 | }, 245 | "execution_count": 5, 246 | "metadata": {}, 247 | "output_type": "execute_result" 248 | } 249 | ], 250 | "source": [ 251 | "y_df.head(3)" 252 | ] 253 | }, 254 | { 255 | "cell_type": "markdown", 256 | "metadata": {}, 257 | "source": [ 258 | "Now we convert all **pandas dataframes** to **numpy arrays** for calculations." 259 | ] 260 | }, 261 | { 262 | "cell_type": "code", 263 | "execution_count": 6, 264 | "metadata": {}, 265 | "outputs": [ 266 | { 267 | "name": "stdout", 268 | "output_type": "stream", 269 | "text": [ 270 | "#12 Number of training samples, #1 features per sample\n", 271 | "#21 Number of validation samples, #1 features per sample\n", 272 | "#21 Number of test samples, #1 features per sample\n" 273 | ] 274 | } 275 | ], 276 | "source": [ 277 | "# saving x, y, xval, yval, xtest and ytest into numpy arrays\n", 278 | "x = x_df.iloc[:,:].values\n", 279 | "xval = xval_df.iloc[:,:].values\n", 280 | "xtest = xtest_df.iloc[:,:].values\n", 281 | "\n", 282 | "y = y_df.iloc[:,:].values\n", 283 | "yval = yval_df.iloc[:,:].values\n", 284 | "ytest = ytest_df.iloc[:,:].values\n", 285 | "\n", 286 | "# number of examples and number of features\n", 287 | "m, n = x.shape\n", 288 | "\n", 289 | "m_val = xval.shape[0]\n", 290 | "m_test = xtest.shape[0]\n", 291 | "\n", 292 | "print('#{} Number of training samples, #{} features per sample'.format(m,n))\n", 293 | "print('#{} Number of validation samples, #{} features per sample'.format(m_val,n))\n", 294 | "print('#{} Number of test samples, #{} features per sample'.format(m_test,n))" 295 | ] 296 | }, 297 | { 298 | "cell_type": "code", 299 | "execution_count": 7, 300 | "metadata": {}, 301 | "outputs": [], 302 | "source": [ 303 | "# define some hypter parameters\n", 304 | "\n", 305 | "# define theta as zero\n", 306 | "theta = None\n", 307 | "\n", 308 | "# define hyperparameter λ\n", 309 | "lambda_ = 
None\n", 310 | "\n", 311 | "# reshape (-1,1) because we just have one feature in y column\n", 312 | "y = y.reshape(-1,1)" 313 | ] 314 | }, 315 | { 316 | "cell_type": "markdown", 317 | "metadata": {}, 318 | "source": [ 319 | "### 1.C Ploting Dataset\n", 320 | "We will begin by visualizing the dataset containing historical records on **the change in the water level**, `x`, and **the amount of water flowing out of the dam**, `y`.

\n", 321 | "This dataset is divided into three parts:
\n", 322 | " • A **training set** that your model will learn on: `x`, `y`
\n", 323 | " • A **cross validation set** for determining the regularization parameter: `xval`, `yval`
\n", 324 | " • A **test set** for evaluating performance. These are **\"unseen\" examples** which your model did not see during training: `xtest`, `ytest`
" 325 | ] 326 | }, 327 | { 328 | "cell_type": "code", 329 | "execution_count": 9, 330 | "metadata": {}, 331 | "outputs": [ 332 | { 333 | "data": { 334 | "image/png": "\n", 335 | "text/plain": [ 336 | "
" 337 | ] 338 | }, 339 | "metadata": {}, 340 | "output_type": "display_data" 341 | } 342 | ], 343 | "source": [ 344 | "# import libraries\n", 345 | "import matplotlib.pyplot as plt\n", 346 | "%matplotlib inline\n", 347 | "\n", 348 | "plt.scatter(x, y, color='red', marker='x')\n", 349 | "plt.title('Training Set')\n", 350 | "plt.xlabel('Change in water level (x)')\n", 351 | "plt.ylabel('Water flowing out of the dam (y)')\n", 352 | "plt.grid()\n", 353 | "plt.show()" 354 | ] 355 | }, 356 | { 357 | "cell_type": "markdown", 358 | "metadata": {}, 359 | "source": [ 360 | "# 2. Adding Polynomial Features\n", 361 | "\n", 362 | "For use polynomial regression, our hypothesis has the form:\n", 363 | "Notice that by defining `x1 = (waterLevel)`, `x2 = (waterLevel)`2, ... , `xp = (waterLevel)`p, we obtain a linear regression model where the features are the various powers of the original value (waterLevel).

\n", 364 | "Now, you will **add more features using the higher powers** of the existing feature `x` in the dataset. Your task is to write a function that **maps the original training set `x` of size `m × 1` into its higher powers**. Specifically, when a training set `x` of size `m × 1` is passed into the function, the **function should return an `m × p` matrix `x_poly`**, where column `1` holds the original values of `x`, column `2` holds the values of `x^2`, column `3` holds the values of `x^3`, and so on.
\n", 365 | "Note that **you don’t have to account for the zero-eth power in this function**." 366 | ] 367 | }, 368 | { 369 | "cell_type": "markdown", 370 | "metadata": {}, 371 | "source": [ 372 | "## 2.A Adding Features\n", 373 | "`poly_features(x, p)` takes a data matrix `x` (size `m x 1`) and **maps each example into its polynomial features** where
\n", 374 | "`x_poly[i, :] = [x(i) x(i)^2 x(i)^3 ... x(i)^p]`" 375 | ] 376 | }, 377 | { 378 | "cell_type": "code", 379 | "execution_count": 12, 380 | "metadata": {}, 381 | "outputs": [], 382 | "source": [ 383 | "x_poly = None # the output of polu_features\n", 384 | "p = 8 # order of polynomial features\n", 385 | "\n", 386 | "from sklearn.preprocessing import PolynomialFeatures # import libraries\n", 387 | "def poly_features(x,p): \n", 388 | " polynomial_features = PolynomialFeatures(degree=8, include_bias=False)\n", 389 | " x_poly = polynomial_features.fit_transform(x)\n", 390 | " return x_poly\n", 391 | " " 392 | ] 393 | }, 394 | { 395 | "cell_type": "code", 396 | "execution_count": 13, 397 | "metadata": {}, 398 | "outputs": [ 399 | { 400 | "data": { 401 | "text/html": [ 402 | "
\n", 403 | "\n", 416 | "\n", 417 | " \n", 418 | " \n", 419 | " \n", 420 | " \n", 421 | " \n", 422 | " \n", 423 | " \n", 424 | " \n", 425 | " \n", 426 | " \n", 427 | " \n", 428 | " \n", 429 | " \n", 430 | " \n", 431 | " \n", 432 | " \n", 433 | " \n", 434 | " \n", 435 | " \n", 436 | " \n", 437 | " \n", 438 | " \n", 439 | " \n", 440 | " \n", 441 | " \n", 442 | " \n", 443 | " \n", 444 | " \n", 445 | " \n", 446 | " \n", 447 | " \n", 448 | " \n", 449 | " \n", 450 | " \n", 451 | " \n", 452 | " \n", 453 | " \n", 454 | " \n", 455 | " \n", 456 | " \n", 457 | " \n", 458 | " \n", 459 | " \n", 460 | " \n", 461 | " \n", 462 | " \n", 463 | " \n", 464 | " \n", 465 | "
01234567
0-15.936758253.980260-4047.6219716.450597e+04-1.028016e+061.638324e+07-2.610958e+084.161020e+09
1-29.152979849.896197-24777.0061757.223235e+05-2.105788e+076.139000e+08-1.789701e+105.217513e+11
236.1895491309.68343047396.8521681.715271e+066.207487e+072.246462e+098.129843e+102.942154e+12
\n", 466 | "
" 467 | ], 468 | "text/plain": [ 469 | " 0 1 2 3 4 \\\n", 470 | "0 -15.936758 253.980260 -4047.621971 6.450597e+04 -1.028016e+06 \n", 471 | "1 -29.152979 849.896197 -24777.006175 7.223235e+05 -2.105788e+07 \n", 472 | "2 36.189549 1309.683430 47396.852168 1.715271e+06 6.207487e+07 \n", 473 | "\n", 474 | " 5 6 7 \n", 475 | "0 1.638324e+07 -2.610958e+08 4.161020e+09 \n", 476 | "1 6.139000e+08 -1.789701e+10 5.217513e+11 \n", 477 | "2 2.246462e+09 8.129843e+10 2.942154e+12 " 478 | ] 479 | }, 480 | "execution_count": 13, 481 | "metadata": {}, 482 | "output_type": "execute_result" 483 | } 484 | ], 485 | "source": [ 486 | "x_poly = poly_features(x,p)\n", 487 | "x_poly_df = pd.DataFrame(x_poly,columns=None)\n", 488 | "x_poly_df.head(3)" 489 | ] 490 | }, 491 | { 492 | "cell_type": "markdown", 493 | "metadata": {}, 494 | "source": [ 495 | "#### Now we add these features to `xtest` and `xval`" 496 | ] 497 | }, 498 | { 499 | "cell_type": "code", 500 | "execution_count": 14, 501 | "metadata": {}, 502 | "outputs": [ 503 | { 504 | "data": { 505 | "text/html": [ 506 | "
\n", 507 | "\n", 520 | "\n", 521 | " \n", 522 | " \n", 523 | " \n", 524 | " \n", 525 | " \n", 526 | " \n", 527 | " \n", 528 | " \n", 529 | " \n", 530 | " \n", 531 | " \n", 532 | " \n", 533 | " \n", 534 | " \n", 535 | " \n", 536 | " \n", 537 | " \n", 538 | " \n", 539 | " \n", 540 | " \n", 541 | " \n", 542 | " \n", 543 | " \n", 544 | " \n", 545 | " \n", 546 | " \n", 547 | " \n", 548 | " \n", 549 | " \n", 550 | " \n", 551 | " \n", 552 | " \n", 553 | " \n", 554 | " \n", 555 | " \n", 556 | " \n", 557 | " \n", 558 | " \n", 559 | " \n", 560 | " \n", 561 | " \n", 562 | " \n", 563 | " \n", 564 | " \n", 565 | " \n", 566 | " \n", 567 | " \n", 568 | " \n", 569 | "
01234567
0-16.746536280.446461-4696.5066867.865022e+04-1.317119e+062.205718e+07-3.693813e+086.185857e+09
1-14.577471212.502653-3097.7512154.515738e+04-6.582804e+059.596063e+06-1.398863e+082.039189e+09
234.5157591191.33759641119.9209321.419285e+064.898771e+071.690848e+095.836090e+102.014371e+12
\n", 570 | "
" 571 | ], 572 | "text/plain": [ 573 | " 0 1 2 3 4 \\\n", 574 | "0 -16.746536 280.446461 -4696.506686 7.865022e+04 -1.317119e+06 \n", 575 | "1 -14.577471 212.502653 -3097.751215 4.515738e+04 -6.582804e+05 \n", 576 | "2 34.515759 1191.337596 41119.920932 1.419285e+06 4.898771e+07 \n", 577 | "\n", 578 | " 5 6 7 \n", 579 | "0 2.205718e+07 -3.693813e+08 6.185857e+09 \n", 580 | "1 9.596063e+06 -1.398863e+08 2.039189e+09 \n", 581 | "2 1.690848e+09 5.836090e+10 2.014371e+12 " 582 | ] 583 | }, 584 | "execution_count": 14, 585 | "metadata": {}, 586 | "output_type": "execute_result" 587 | } 588 | ], 589 | "source": [ 590 | "xval_poly = poly_features(xval,p)\n", 591 | "xval_poly_df = pd.DataFrame(xval_poly,columns=None)\n", 592 | "xval_poly_df.head(3)" 593 | ] 594 | }, 595 | { 596 | "cell_type": "code", 597 | "execution_count": 15, 598 | "metadata": {}, 599 | "outputs": [ 600 | { 601 | "data": { 602 | "text/html": [ 603 | "
\n", 604 | "\n", 617 | "\n", 618 | " \n", 619 | " \n", 620 | " \n", 621 | " \n", 622 | " \n", 623 | " \n", 624 | " \n", 625 | " \n", 626 | " \n", 627 | " \n", 628 | " \n", 629 | " \n", 630 | " \n", 631 | " \n", 632 | " \n", 633 | " \n", 634 | " \n", 635 | " \n", 636 | " \n", 637 | " \n", 638 | " \n", 639 | " \n", 640 | " \n", 641 | " \n", 642 | " \n", 643 | " \n", 644 | " \n", 645 | " \n", 646 | " \n", 647 | " \n", 648 | " \n", 649 | " \n", 650 | " \n", 651 | " \n", 652 | " \n", 653 | " \n", 654 | " \n", 655 | " \n", 656 | " \n", 657 | " \n", 658 | " \n", 659 | " \n", 660 | " \n", 661 | " \n", 662 | " \n", 663 | " \n", 664 | " \n", 665 | " \n", 666 | "
01234567
0-33.3180041110.089390-36985.9627231.232298e+06-4.105772e+071.367961e+09-4.557774e+101.518559e+12
1-37.9121641437.332181-54492.3734212.065924e+06-7.832364e+072.969419e+09-1.125771e+114.268041e+12
2-51.2069382622.150494-134272.2976396.875673e+06-3.520822e+081.802905e+10-9.232124e+114.727488e+13
\n", 667 | "
" 668 | ], 669 | "text/plain": [ 670 | " 0 1 2 3 4 \\\n", 671 | "0 -33.318004 1110.089390 -36985.962723 1.232298e+06 -4.105772e+07 \n", 672 | "1 -37.912164 1437.332181 -54492.373421 2.065924e+06 -7.832364e+07 \n", 673 | "2 -51.206938 2622.150494 -134272.297639 6.875673e+06 -3.520822e+08 \n", 674 | "\n", 675 | " 5 6 7 \n", 676 | "0 1.367961e+09 -4.557774e+10 1.518559e+12 \n", 677 | "1 2.969419e+09 -1.125771e+11 4.268041e+12 \n", 678 | "2 1.802905e+10 -9.232124e+11 4.727488e+13 " 679 | ] 680 | }, 681 | "execution_count": 15, 682 | "metadata": {}, 683 | "output_type": "execute_result" 684 | } 685 | ], 686 | "source": [ 687 | "xtest_poly = poly_features(xtest,p)\n", 688 | "xtest_poly_df = pd.DataFrame(xtest_poly,columns=None)\n", 689 | "xtest_poly_df.head(3)" 690 | ] 691 | }, 692 | { 693 | "cell_type": "markdown", 694 | "metadata": {}, 695 | "source": [ 696 | "## 2.B Normalize Features\n", 697 | "It turns out that if we run the training directly on the projected data, will not work well as the **features** would be **badly scaled** (e.g., an example with **x = 40 will now have a feature x8 = 408 = 6.5 × 1012**).
\n", 698 | "Therefore, you will need to use **feature normalization**.\n", 699 | "`feature_normalize(x)` returns a **normalized version** of `x` where the **mean value of each feature is 0** and the **standard deviation is 1**. This is often a **good preprocessing step** to do when working with learning algorithms." 700 | ] 701 | }, 702 | { 703 | "cell_type": "code", 704 | "execution_count": 16, 705 | "metadata": {}, 706 | "outputs": [], 707 | "source": [ 708 | "def feature_normalize(x, xtest, xval):\n", 709 | " sigma = x.std()\n", 710 | " mean = x.mean()\n", 711 | " x_norm = (x-mean)/sigma\n", 712 | " xtest_norm = (xtest-mean)/sigma\n", 713 | " xval_norm = (xval-mean)/sigma\n", 714 | " return (x_norm, xtest_norm, xval_norm)" 715 | ] 716 | }, 717 | { 718 | "cell_type": "code", 719 | "execution_count": 17, 720 | "metadata": {}, 721 | "outputs": [], 722 | "source": [ 723 | "x_poly_norm, xtest_poly_norm, xval_poly_norm = feature_normalize(x_poly,xtest_poly, xval_poly)" 724 | ] 725 | }, 726 | { 727 | "cell_type": "code", 728 | "execution_count": 18, 729 | "metadata": {}, 730 | "outputs": [ 731 | { 732 | "name": "stdout", 733 | "output_type": "stream", 734 | "text": [ 735 | "x_poly_norm : mean= -1.850371707708594e-17, std=0.9999999999999999.\n", 736 | "xval_poly_norm : mean= 0.044848630228004685, std=1.2247731967735336.\n", 737 | "xtest_poly_norm : mean= 0.1606768875137592, std=2.5245490041714636.\n" 738 | ] 739 | } 740 | ], 741 | "source": [ 742 | "print('x_poly_norm : mean= {}, std={}.'.format(x_poly_norm.mean(),x_poly_norm.std()))\n", 743 | "print('xval_poly_norm : mean= {}, std={}.'.format(xval_poly_norm.mean(),xval_poly_norm.std()))\n", 744 | "print('xtest_poly_norm : mean= {}, std={}.'.format(xtest_poly_norm.mean(),xtest_poly_norm.std()))" 745 | ] 746 | }, 747 | { 748 | "cell_type": "markdown", 749 | "metadata": {}, 750 | "source": [ 751 | "Look at this [link](https://stackoverflow.com/questions/40405803/mean-of-data-scaled-with-sklearn-standardscaler-is-not-zero) 
if you have any questions about why, after **scaling**, we still do not have exactly **mean = 0** and **std = 1**.
\n", 752 | "Actually the values are zero." 753 | ] 754 | }, 755 | { 756 | "cell_type": "code", 757 | "execution_count": 20, 758 | "metadata": {}, 759 | "outputs": [], 760 | "source": [ 761 | "# add 1's to the features of x as bias\n", 762 | "x_poly_norm = np.append(np.ones(shape=(m,1)),x_poly_norm,axis = 1)\n", 763 | "xval_poly_norm = np.append(np.ones(shape=(xval_poly_norm.shape[0],1)),xval_poly_norm,axis = 1)\n", 764 | "xtest_poly_norm = np.append(np.ones(shape=(xtest_poly_norm.shape[0],1)),xtest_poly_norm,axis = 1)" 765 | ] 766 | }, 767 | { 768 | "cell_type": "markdown", 769 | "metadata": {}, 770 | "source": [ 771 | "# 3. Learning Polynomial Regression\n", 772 | "We will proceed to **train polynomial regression using your linear regression cost function**.

\n", 773 | "Keep in mind that even though **we have polynomial terms** in our feature vector, we are **still solving a linear regression** optimization problem. The **polynomial terms have simply turned into features** that we can use for linear regression. We are using the **same cost function and gradient** that you wrote for the earlier part of this exercise.
" 774 | ] 775 | }, 776 | { 777 | "cell_type": "markdown", 778 | "metadata": {}, 779 | "source": [ 780 | "## 3.A Regularized Linear Regression Cost Function\n", 781 | "Recall that regularized linear regression has the following cost function:

\n", 782 | "where `lambda` is a regularization parameter which controls the degree of regularization (thus, **helping prevent overfitting**). The **regularization** term puts a **penalty** on the overall **cost J**.

\n", 783 | "As the magnitudes of the model parameters **θj**\n", 784 | "increase, the penalty increases as well. Note that you should not regularize the **θ0** term.

\n", 785 | "For this part of the exercise, you will be using a **polynomial of degree 8**.
\n", 786 | "After learning the parameters **θ**, you should draw two plots generated for polynomial regression with **λ = 0**.
" 787 | ] 788 | }, 789 | { 790 | "cell_type": "markdown", 791 | "metadata": {}, 792 | "source": [ 793 | "### Implementation\n", 794 | "`linear_reg_cost(x, y, theta, lambda_)` computes the cost of using `theta` as the parameter for linear regression to fit the data points in `x` and `y`. Returns the cost in `j` as cost." 795 | ] 796 | }, 797 | { 798 | "cell_type": "code", 799 | "execution_count": 22, 800 | "metadata": {}, 801 | "outputs": [], 802 | "source": [ 803 | "def hypothesis(x,theta):\n", 804 | " return np.dot(x,theta)" 805 | ] 806 | }, 807 | { 808 | "cell_type": "code", 809 | "execution_count": 23, 810 | "metadata": {}, 811 | "outputs": [], 812 | "source": [ 813 | "def linear_reg_cost(theta_flatten, x_flatten, y, lambda_, num_of_samples, num_of_features):\n", 814 | " x = x_flatten.reshape(num_of_samples, num_of_features)\n", 815 | " theta = theta_flatten.reshape(n,1)\n", 816 | " loss = hypothesis(x,theta)-y\n", 817 | " regularizer = lambda_*np.sum(theta[1:,:]**2)/(2*m)\n", 818 | " j = np.sum(loss ** 2)/(2*m) \n", 819 | " return j" 820 | ] 821 | }, 822 | { 823 | "cell_type": "markdown", 824 | "metadata": {}, 825 | "source": [ 826 | "## 3.B Regularized Linear Regression Gradient\n", 827 | "Correspondingly, the **partial derivative of regularized linear regression’s cost for θj** is defined as:" 828 | ] 829 | }, 830 | { 831 | "cell_type": "markdown", 832 | "metadata": {}, 833 | "source": [ 834 | "### Implementation\n", 835 | "`linear_reg_grad(x, y, theta, lambda_)` computes the gradient of cost of using `theta` as the parameter for linear regression to fit the data points in `x` and `y`. Returns the gradient in `grad`." 
836 | ] 837 | }, 838 | { 839 | "cell_type": "code", 840 | "execution_count": 24, 841 | "metadata": {}, 842 | "outputs": [], 843 | "source": [ 844 | "def linear_reg_grad(theta_flatten, x_flatten, y, lambda_, num_of_samples, num_of_features):\n", 845 | " x = x_flatten.reshape(num_of_samples, num_of_features)\n", 846 | " m,n = x.shape\n", 847 | " theta = theta_flatten.reshape(n,1)\n", 848 | " new_theta = np.zeros(shape=(theta.shape))\n", 849 | " loss = hypothesis(x,theta)-y\n", 850 | " gradient = np.dot(x.T,loss)\n", 851 | " new_theta[0:,:] = gradient/m\n", 852 | " new_theta[1:,:] = gradient[1:,:]/m + lambda_*(theta[1:,]/m)\n", 853 | " return new_theta.flatten()" 854 | ] 855 | }, 856 | { 857 | "cell_type": "markdown", 858 | "metadata": {}, 859 | "source": [ 860 | "## 3.C Fitting Linear Regression\n", 861 | "Once your cost function and gradient are working correctly, the next part is to **compute the optimal values** of **θ**.
\n", 862 | "This training function uses `fmin_cg` to optimize the cost function. See official doc
" 863 | ] 864 | }, 865 | { 866 | "cell_type": "markdown", 867 | "metadata": {}, 868 | "source": [ 869 | "### Implementation\n", 870 | "Once you have implemented the cost and gradient correctly, the `fmin_cg` function will use your cost function to train regularized linear regression and update theta each time." 871 | ] 872 | }, 873 | { 874 | "cell_type": "code", 875 | "execution_count": 28, 876 | "metadata": {}, 877 | "outputs": [ 878 | { 879 | "name": "stdout", 880 | "output_type": "stream", 881 | "text": [ 882 | "Optimization terminated successfully.\n", 883 | " Current function value: 15.795185\n", 884 | " Iterations: 198\n", 885 | " Function evaluations: 454\n", 886 | " Gradient evaluations: 454\n" 887 | ] 888 | } 889 | ], 890 | "source": [ 891 | "m,n = x_poly_norm.shape\n", 892 | "lambda_ = 0\n", 893 | "theta = np.ones(n)\n", 894 | "\n", 895 | "from scipy.optimize import fmin_cg\n", 896 | "new_theta = fmin_cg(f=linear_reg_cost, x0=theta, fprime=linear_reg_grad, args=(x_poly_norm.flatten(), y, lambda_, m,n))" 897 | ] 898 | }, 899 | { 900 | "cell_type": "code", 901 | "execution_count": 31, 902 | "metadata": {}, 903 | "outputs": [ 904 | { 905 | "data": { 906 | "text/plain": [ 907 | "array([ 286.25746025, -46.25445386, -46.25037961, -45.57463053,\n", 908 | " -44.4634646 , 229.73026807, 1062.20194521, 561.40028703,\n", 909 | " 10.76226527])" 910 | ] 911 | }, 912 | "execution_count": 31, 913 | "metadata": {}, 914 | "output_type": "execute_result" 915 | } 916 | ], 917 | "source": [ 918 | "new_theta" 919 | ] 920 | }, 921 | { 922 | "cell_type": "markdown", 923 | "metadata": {}, 924 | "source": [ 925 | "## 3.D Visualization of Fitted Model\n", 926 | "Finally, you should also **plot the best fit line**. The best fit line tells us that the model is a good fit to the data because the **data has a non-linear pattern**. While **visualizing the best fit** as shown is **one possible way to debug** your learning algorithm, it is not always easy to visualize the data and model.

\n", 927 | "In the next section, you will implement a function to **generate learning curves** that can help you debug your learning algorithm even if it is **not easy to visualize** the data." 928 | ] 929 | }, 930 | { 931 | "cell_type": "code", 932 | "execution_count": 43, 933 | "metadata": {}, 934 | "outputs": [ 935 | { 936 | "data": { 937 | "image/png": "\n", 938 | "text/plain": [ 939 | "
" 940 | ] 941 | }, 942 | "metadata": {}, 943 | "output_type": "display_data" 944 | } 945 | ], 946 | "source": [ 947 | "# import libraries\n", 948 | "import matplotlib.pyplot as plt\n", 949 | "%matplotlib inline\n", 950 | "\n", 951 | "plt.scatter(x, y, color='red', marker='x', label= 'train data')\n", 952 | "plt.plot(x.flatten(),np.dot(x_poly_norm,new_theta.reshape(n,1).flatten()), label = 'best fit model')\n", 953 | "#plt.axis([-40,50,-75,75])\n", 954 | "plt.title('Training Set')\n", 955 | "plt.xlabel('Change in water level (x)')\n", 956 | "plt.ylabel('Water flowing out of the dam (y)')\n", 957 | "plt.grid()\n", 958 | "plt.legend()\n", 959 | "plt.show()" 960 | ] 961 | } 962 | ], 963 | "metadata": { 964 | "kernelspec": { 965 | "display_name": "Python 3", 966 | "language": "python", 967 | "name": "python3" 968 | }, 969 | "language_info": { 970 | "codemirror_mode": { 971 | "name": "ipython", 972 | "version": 3 973 | }, 974 | "file_extension": ".py", 975 | "mimetype": "text/x-python", 976 | "name": "python", 977 | "nbconvert_exporter": "python", 978 | "pygments_lexer": "ipython3", 979 | "version": "3.6.6" 980 | } 981 | }, 982 | "nbformat": 4, 983 | "nbformat_minor": 2 984 | } 985 | -------------------------------------------------------------------------------- /Week 6 - Regularized Linear Regression and Bias v.s. Variance/Regularized Linear Regression.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "cells": [ 3 | { 4 | "cell_type": "markdown", 5 | "metadata": {}, 6 | "source": [ 7 | "# Regularized Linear Regression\n", 8 | "\n", 9 | "In the first half of the exercise, you will implement regularized linear regression to predict the amount of water flowing out of a dam using the change of water level in a reservoir. In the next half, you will go through some **diagnostics of debugging learning algorithms** and examine the **effects of bias v.s. variance.**

\n", 10 | "In the following parts, you will implement linear regression and use that to fit a **straight line** to the data and plot learning curves. Following that, you will implement **polynomial regression** to find a **better fit** to the data.\n", 11 | "\n", 12 | "The file ex5data1 contains a dataset that includes a training set, a test set, and a validation set.
\n", 13 | "The structure of the dataset is described below:
\n", 14 | "1. x = **Water level (a single feature)**\n", 15 | "2. y = **Value of flowed water**\n", 16 | "3. xval = **x validation set**\n", 17 | "4. yval = **y validation set**\n", 18 | "5. xtest = **x test set**\n", 19 | "6. ytest = **y test set**\n", 20 | "\n", 21 | "\n", 22 | "

\n", 23 | "\n", 24 | "Our assignment has these sections:\n", 25 | "1. Visualizing the Data\n", 26 | " 1. Converting .mat to .csv\n", 27 | " 2. Loading Dataset\n", 28 | " 3. Visualizing The Dataset\n", 29 | "2. Regularized Linear Regression Cost Function\n", 30 | " 1. Implementation\n", 31 | " 2. Test Cost Function\n", 32 | "3. Regularized Linear Regression Gradient\n", 33 | " 1. Implementation\n", 34 | " 2. Test Gradient Function\n", 35 | "4. Fitting Linear Regression\n", 36 | " 1. Implementation\n", 37 | " 2. Visualization of Fitted Model\n", 38 | "5. Bias-variance\n", 39 | " 1. Learning Curves\n", 40 | " 2. Plotting Learning Curve\n", 41 | " \n", 42 | "\n", 43 | "\n", 44 | "A full description is provided in each section." 45 | ] 46 | }, 47 | { 48 | "cell_type": "markdown", 49 | "metadata": {}, 50 | "source": [ 51 | "## 1. Visualizing the Dataset\n", 52 | "Before starting on any task, it is often useful to understand the data by visualizing it.
" 53 | ] 54 | }, 55 | { 56 | "cell_type": "markdown", 57 | "metadata": {}, 58 | "source": [ 59 | "### 1.A Converting .mat to .csv\n", 60 | "In this specific assignment, the instructor added a .mat file as training set and weights of trained neural network. But we have to convert it to .csv to use in python.
\n", 61 | "After all we now ready to import our new csv files to pandas dataframes and do preprocessing on it and make it ready for next steps." 62 | ] 63 | }, 64 | { 65 | "cell_type": "code", 66 | "execution_count": 1, 67 | "metadata": {}, 68 | "outputs": [], 69 | "source": [ 70 | "# import libraries\n", 71 | "import scipy.io\n", 72 | "import numpy as np\n", 73 | "\n", 74 | "data = scipy.io.loadmat(\"ex5data1\")" 75 | ] 76 | }, 77 | { 78 | "cell_type": "markdown", 79 | "metadata": {}, 80 | "source": [ 81 | "Now we **extract** `x`, `y`, `xval`, `yval`, `xtest` and `ytest` variables from the .mat file and save them into .csv file for further usage. After running the below code you should see:\n", 82 | "1. X.csv\n", 83 | "2. y.csv \n", 84 | "3. Xtest.csv\n", 85 | "4. ytest.csv\n", 86 | "5. Xval.csv\n", 87 | "6. yval.csv\n", 88 | "\n", 89 | "files in your directory." 90 | ] 91 | }, 92 | { 93 | "cell_type": "code", 94 | "execution_count": 2, 95 | "metadata": {}, 96 | "outputs": [], 97 | "source": [ 98 | "for i in data:\n", 99 | " if '__' not in i and 'readme' not in i:\n", 100 | " np.savetxt((i+\".csv\"),data[i],delimiter=',')" 101 | ] 102 | }, 103 | { 104 | "cell_type": "markdown", 105 | "metadata": {}, 106 | "source": [ 107 | "### 1.B Loading Dataset\n", 108 | "First we import .csv files into pandas dataframes then save them into numpy arrays.

" 109 | ] 110 | }, 111 | { 112 | "cell_type": "code", 113 | "execution_count": 3, 114 | "metadata": {}, 115 | "outputs": [], 116 | "source": [ 117 | "# import library\n", 118 | "import pandas as pd\n", 119 | "\n", 120 | "# saving .csv files to pandas dataframes\n", 121 | "x_df = pd.read_csv('X.csv',names= ['x'])\n", 122 | "xtest_df = pd.read_csv('Xtest.csv',names= ['xtest'])\n", 123 | "xval_df = pd.read_csv('Xval.csv',names= ['xval'])\n", 124 | "y_df = pd.read_csv('y.csv',names=['y'])\n", 125 | "ytest_df = pd.read_csv('ytest.csv',names= ['ytest'])\n", 126 | "yval_df = pd.read_csv('yval.csv',names= ['yval'])" 127 | ] 128 | }, 129 | { 130 | "cell_type": "code", 131 | "execution_count": 4, 132 | "metadata": {}, 133 | "outputs": [ 134 | { 135 | "data": { 136 | "text/html": [ 137 | "
\n", 138 | "\n", 151 | "\n", 152 | " \n", 153 | " \n", 154 | " \n", 155 | " \n", 156 | " \n", 157 | " \n", 158 | " \n", 159 | " \n", 160 | " \n", 161 | " \n", 162 | " \n", 163 | " \n", 164 | " \n", 165 | " \n", 166 | " \n", 167 | " \n", 168 | " \n", 169 | " \n", 170 | " \n", 171 | " \n", 172 | "
x
0-15.936758
1-29.152979
236.189549
\n", 173 | "
" 174 | ], 175 | "text/plain": [ 176 | " x\n", 177 | "0 -15.936758\n", 178 | "1 -29.152979\n", 179 | "2 36.189549" 180 | ] 181 | }, 182 | "execution_count": 4, 183 | "metadata": {}, 184 | "output_type": "execute_result" 185 | } 186 | ], 187 | "source": [ 188 | "x_df.head(3)" 189 | ] 190 | }, 191 | { 192 | "cell_type": "code", 193 | "execution_count": 5, 194 | "metadata": {}, 195 | "outputs": [ 196 | { 197 | "data": { 198 | "text/html": [ 199 | "
\n", 200 | "\n", 213 | "\n", 214 | " \n", 215 | " \n", 216 | " \n", 217 | " \n", 218 | " \n", 219 | " \n", 220 | " \n", 221 | " \n", 222 | " \n", 223 | " \n", 224 | " \n", 225 | " \n", 226 | " \n", 227 | " \n", 228 | " \n", 229 | " \n", 230 | " \n", 231 | " \n", 232 | " \n", 233 | " \n", 234 | "
y
02.134311
11.173257
234.359109
\n", 235 | "
" 236 | ], 237 | "text/plain": [ 238 | " y\n", 239 | "0 2.134311\n", 240 | "1 1.173257\n", 241 | "2 34.359109" 242 | ] 243 | }, 244 | "execution_count": 5, 245 | "metadata": {}, 246 | "output_type": "execute_result" 247 | } 248 | ], 249 | "source": [ 250 | "y_df.head(3)" 251 | ] 252 | }, 253 | { 254 | "cell_type": "markdown", 255 | "metadata": {}, 256 | "source": [ 257 | "Now we convert all **pandas dataframes** to **numpy arrays** for calculations." 258 | ] 259 | }, 260 | { 261 | "cell_type": "code", 262 | "execution_count": 6, 263 | "metadata": {}, 264 | "outputs": [ 265 | { 266 | "name": "stdout", 267 | "output_type": "stream", 268 | "text": [ 269 | "#12 Number of training samples, #1 features per sample\n", 270 | "#21 Number of validation samples, #1 features per sample\n", 271 | "#21 Number of test samples, #1 features per sample\n" 272 | ] 273 | } 274 | ], 275 | "source": [ 276 | "# saving x, y, xval, yval, xtest and ytest into numpy arrays\n", 277 | "x = x_df.iloc[:,:].values\n", 278 | "xval = xval_df.iloc[:,:].values\n", 279 | "xtest = xtest_df.iloc[:,:].values\n", 280 | "\n", 281 | "y = y_df.iloc[:,:].values\n", 282 | "yval = yval_df.iloc[:,:].values\n", 283 | "ytest = ytest_df.iloc[:,:].values\n", 284 | "\n", 285 | "# number of examples and number of features\n", 286 | "m, n = x.shape\n", 287 | "\n", 288 | "# add 1's to the features of x as bias\n", 289 | "x = np.append(np.ones(shape=(m,1)),x,axis = 1)\n", 290 | "xval = np.append(np.ones(shape=(xval.shape[0],1)),xval,axis = 1)\n", 291 | "xtest = np.append(np.ones(shape=(xtest.shape[0],1)),xtest,axis = 1)\n", 292 | "\n", 293 | "\n", 294 | "\n", 295 | "m_val = xval.shape[0]\n", 296 | "m_test = xtest.shape[0]\n", 297 | "\n", 298 | "print('#{} Number of training samples, #{} features per sample'.format(m,n))\n", 299 | "print('#{} Number of validation samples, #{} features per sample'.format(m_val,n))\n", 300 | "print('#{} Number of test samples, #{} features per sample'.format(m_test,n))" 301 | ] 302 | }, 303 
| { 304 | "cell_type": "code", 305 | "execution_count": 7, 306 | "metadata": {}, 307 | "outputs": [], 308 | "source": [ 309 | "# define some hypter parameters\n", 310 | "\n", 311 | "# define theta as zero\n", 312 | "theta = None\n", 313 | "\n", 314 | "# define hyperparameter λ\n", 315 | "lambda_ = None\n", 316 | "\n", 317 | "# reshape (-1,1) because we just have one feature in y column\n", 318 | "y = y.reshape(-1,1)" 319 | ] 320 | }, 321 | { 322 | "cell_type": "markdown", 323 | "metadata": {}, 324 | "source": [ 325 | "### 1.C Ploting Dataset\n", 326 | "We will begin by visualizing the dataset containing historical records on **the change in the water level**, `x`, and **the amount of water flowing out of the dam**, `y`.

\n", 327 | "This dataset is divided into three parts:
\n", 328 | " • A **training set** that your model will learn on: `x`, `y`
\n", 329 | " • A **cross validation set** for determining the regularization parameter: `xval`, `yval`
\n", 330 | " • A **test set** for evaluating performance. These are **\"unseen\" examples** which your model did not see during training: `xtest`, `ytest`
" 331 | ] 332 | }, 333 | { 334 | "cell_type": "code", 335 | "execution_count": 8, 336 | "metadata": {}, 337 | "outputs": [ 338 | { 339 | "data": { 340 | "image/png": "\n", 341 | "text/plain": [ 342 | "
" 343 | ] 344 | }, 345 | "metadata": {}, 346 | "output_type": "display_data" 347 | } 348 | ], 349 | "source": [ 350 | "# import libraries\n", 351 | "import matplotlib.pyplot as plt\n", 352 | "%matplotlib inline\n", 353 | "\n", 354 | "plt.scatter(x[:,1], y, color='red', marker='x')\n", 355 | "plt.title('Training Set')\n", 356 | "plt.xlabel('Change in water level (x)')\n", 357 | "plt.ylabel('Water flowing out of the dam (y)')\n", 358 | "plt.grid()\n", 359 | "plt.show()" 360 | ] 361 | }, 362 | { 363 | "cell_type": "markdown", 364 | "metadata": {}, 365 | "source": [ 366 | "# 2 Regularized Linear Regression Cost Function\n", 367 | "Recall that regularized linear regression has the following cost function:

\n", 368 | "where `lambda` is a regularization parameter which controls the degree of regularization (thus, **helping prevent overfitting**). The **regularization** term puts a **penalty** on the overall **cost J**.

\n", 369 | "As the magnitudes of the model parameters **θj**\n", 370 | "increase, the penalty increases as well. Note that you should not regularize the **θ0** term.

\n", 371 | "\n", 372 | "**Your task is to write a function to calculate the regularized linear regression cost function. If possible, try to vectorize your code and avoid writing loops.**" 373 | ] 374 | }, 375 | { 376 | "cell_type": "markdown", 377 | "metadata": {}, 378 | "source": [ 379 | "# 2.A Implementation\n", 380 | "`linear_reg_cost(x, y, theta, lambda_)` computes the cost of using `theta` as the parameter for linear regression to fit the data points in `x` and `y`. Returns the cost in `j` as cost." 381 | ] 382 | }, 383 | { 384 | "cell_type": "code", 385 | "execution_count": 9, 386 | "metadata": {}, 387 | "outputs": [], 388 | "source": [ 389 | "def hypothesis(x,theta):\n", 390 | " return np.dot(x,theta)" 391 | ] 392 | }, 393 | { 394 | "cell_type": "code", 395 | "execution_count": 10, 396 | "metadata": {}, 397 | "outputs": [], 398 | "source": [ 399 | "def linear_reg_cost(theta_flatten, x_flatten, y, lambda_, num_of_samples, num_of_features):\n", 400 | " x = x_flatten.reshape(num_of_samples, num_of_features)\n", 401 | " theta = theta_flatten.reshape(n,1)\n", 402 | " loss = hypothesis(x,theta)-y\n", 403 | " regularizer = lambda_*np.sum(theta[1:,:]**2)/(2*m)\n", 404 | " j = np.sum(loss ** 2)/(2*m) \n", 405 | " return j" 406 | ] 407 | }, 408 | { 409 | "cell_type": "markdown", 410 | "metadata": {}, 411 | "source": [ 412 | "## 2.B Test Cost Function\n", 413 | "Cost at `theta` = [1,1] should be about **303.993192**" 414 | ] 415 | }, 416 | { 417 | "cell_type": "code", 418 | "execution_count": 11, 419 | "metadata": {}, 420 | "outputs": [ 421 | { 422 | "data": { 423 | "text/plain": [ 424 | "303.95152555359761" 425 | ] 426 | }, 427 | "execution_count": 11, 428 | "metadata": {}, 429 | "output_type": "execute_result" 430 | } 431 | ], 432 | "source": [ 433 | "m,n = x.shape\n", 434 | "theta = np.ones(n)\n", 435 | "lambda_= 1\n", 436 | "linear_reg_cost(theta.flatten(), x.flatten(),y,lambda_,m,n)" 437 | ] 438 | }, 439 | { 440 | "cell_type": "markdown", 441 | "metadata": {}, 
442 | "source": [ 443 | "compute_gradient(theta, x, y,lambda): computes the gradient of the cost using theta as the parameter." 444 | ] 445 | }, 446 | { 447 | "cell_type": "markdown", 448 | "metadata": {}, 449 | "source": [ 450 | "# 3. Regularized Linear Regression Gradient\n", 451 | "Correspondingly, the **partial derivative of regularized linear regression’s cost for θj** is defined as:" 452 | ] 453 | }, 454 | { 455 | "cell_type": "markdown", 456 | "metadata": {}, 457 | "source": [ 458 | "## 3.A Implementation" 459 | ] 460 | }, 461 | { 462 | "cell_type": "markdown", 463 | "metadata": {}, 464 | "source": [ 465 | "`linear_reg_grad(x, y, theta, lambda_)` computes the gradient of cost of using `theta` as the parameter for linear regression to fit the data points in `x` and `y`. Returns the gradient in `grad`." 466 | ] 467 | }, 468 | { 469 | "cell_type": "code", 470 | "execution_count": 12, 471 | "metadata": {}, 472 | "outputs": [], 473 | "source": [ 474 | "def linear_reg_grad(theta_flatten, x_flatten, y, lambda_, num_of_samples, num_of_features):\n", 475 | " x = x_flatten.reshape(num_of_samples, num_of_features)\n", 476 | " m,n = x.shape\n", 477 | " theta = theta_flatten.reshape(n,1)\n", 478 | " new_theta = np.zeros(shape=(theta.shape))\n", 479 | " loss = hypothesis(x,theta)-y\n", 480 | " gradient = np.dot(x.T,loss)\n", 481 | " new_theta[0:,:] = gradient/m\n", 482 | " new_theta[1:,:] = gradient[1:,:]/m + lambda_*(theta[1:,]/m)\n", 483 | " return new_theta.flatten()" 484 | ] 485 | }, 486 | { 487 | "cell_type": "markdown", 488 | "metadata": {}, 489 | "source": [ 490 | "## 3.B Test Gradient Function\n", 491 | "Run your gradient function using `theta = [1; 1]`, You should expect to see a `gradient = [-15.30; 598.250]`." 
492 | ] 493 | }, 494 | { 495 | "cell_type": "code", 496 | "execution_count": 13, 497 | "metadata": {}, 498 | "outputs": [], 499 | "source": [ 500 | "theta = np.ones(n)\n", 501 | "lambda_ = 0\n", 502 | "grad = linear_reg_grad(theta,x.flatten(),y,lambda_,m,n)" 503 | ] 504 | }, 505 | { 506 | "cell_type": "code", 507 | "execution_count": 14, 508 | "metadata": {}, 509 | "outputs": [ 510 | { 511 | "data": { 512 | "text/plain": [ 513 | "array([ -15.30301567, 598.16741084])" 514 | ] 515 | }, 516 | "execution_count": 14, 517 | "metadata": {}, 518 | "output_type": "execute_result" 519 | } 520 | ], 521 | "source": [ 522 | "grad" 523 | ] 524 | }, 525 | { 526 | "cell_type": "markdown", 527 | "metadata": {}, 528 | "source": [ 529 | "# 4. Fitting Linear Regression\n", 530 | "Once your cost function and gradient are working correctly, the next part is to **compute the optimal values** of **θ**.
\n", 531 | "This training function uses `fmin_cg` to optimize the cost function. See official doc
\n", 532 | "In this part, we set regularization parameter **λ** to **zero**. Because our current implementation of linear regression is trying to fit a 2-dimensional **θ**, regularization will not be incredibly helpful for a **θ** of such **low dimension**.
\n", 533 | "In the later parts of the exercise, you will be using **polynomial regression with regularization**." 534 | ] 535 | }, 536 | { 537 | "cell_type": "markdown", 538 | "metadata": {}, 539 | "source": [ 540 | "## 4.A Implementation\n", 541 | "Once you have implemented the cost and gradient correctly, the `fmin_cg` function will use your cost function to train regularized linear regression and update theta each time." 542 | ] 543 | }, 544 | { 545 | "cell_type": "code", 546 | "execution_count": 15, 547 | "metadata": {}, 548 | "outputs": [ 549 | { 550 | "name": "stdout", 551 | "output_type": "stream", 552 | "text": [ 553 | "Optimization terminated successfully.\n", 554 | " Current function value: 22.373906\n", 555 | " Iterations: 18\n", 556 | " Function evaluations: 28\n", 557 | " Gradient evaluations: 28\n" 558 | ] 559 | } 560 | ], 561 | "source": [ 562 | "theta = np.ones(n)\n", 563 | "\n", 564 | "from scipy.optimize import fmin_cg\n", 565 | "new_theta = fmin_cg(f=linear_reg_cost, x0=theta, fprime=linear_reg_grad, args=(x.flatten(), y, lambda_, m,n))" 566 | ] 567 | }, 568 | { 569 | "cell_type": "code", 570 | "execution_count": 16, 571 | "metadata": {}, 572 | "outputs": [ 573 | { 574 | "data": { 575 | "text/plain": [ 576 | "array([ 13.08790734, 0.36777925])" 577 | ] 578 | }, 579 | "execution_count": 16, 580 | "metadata": {}, 581 | "output_type": "execute_result" 582 | } 583 | ], 584 | "source": [ 585 | "new_theta" 586 | ] 587 | }, 588 | { 589 | "cell_type": "markdown", 590 | "metadata": {}, 591 | "source": [ 592 | "## 4.B Visualization of Fitted Model\n", 593 | "Finally, you should also **plot the best fit line**. The best fit line tells us that the model is not a good fit to the data because the **data has a non-linear pattern**. While **visualizing the best fit** as shown is **one possible way to debug** your learning algorithm, it is not always easy to visualize the data and model.

\n", 594 | "In the next section, you will implement a function to **generate learning curves** that can help you debug your learning algorithm even if it is **not easy to visualize** the data." 595 | ] 596 | }, 597 | { 598 | "cell_type": "code", 599 | "execution_count": 17, 600 | "metadata": {}, 601 | "outputs": [ 602 | { 603 | "data": { 604 | "image/png": "\n", 605 | "text/plain": [ 606 | "
" 607 | ] 608 | }, 609 | "metadata": {}, 610 | "output_type": "display_data" 611 | } 612 | ], 613 | "source": [ 614 | "# import libraries\n", 615 | "import matplotlib.pyplot as plt\n", 616 | "%matplotlib inline\n", 617 | "\n", 618 | "plt.scatter(x[:,1], y, color='red', marker='x', label= 'train data')\n", 619 | "plt.plot(x[:,1],np.dot(x,new_theta.reshape(n,1)), label = 'best fit model')\n", 620 | "plt.title('Training Set')\n", 621 | "plt.xlabel('Change in water level (x)')\n", 622 | "plt.ylabel('Water flowing out of the dam (y)')\n", 623 | "plt.grid()\n", 624 | "plt.legend()\n", 625 | "plt.show()" 626 | ] 627 | }, 628 | { 629 | "cell_type": "markdown", 630 | "metadata": {}, 631 | "source": [ 632 | "# 5. Bias-Variance\n", 633 | "An important concept in machine learning is the **bias-variance tradeoff**. Models with **high bias** are not complex enough for the data and tend to **underfit**, while models with **high variance** **overfit** to the training data.
\n", 634 | "In this part of the exercise, you will plot training and cross validation errors on a learning curve to diagnose bias-variance problems." 635 | ] 636 | }, 637 | { 638 | "cell_type": "markdown", 639 | "metadata": {}, 640 | "source": [ 641 | "## 5.1 Learning Curves\n", 642 | "You will now implement code to generate the learning curves that will be useful in debugging learning algorithms. Recall that a learning curve **plots training and cross validation error as a function of training set size.**
\n", 643 | "To plot the learning curve, we need a training and cross validation set error for **different training set** sizes. To obtain different training set sizes, you should use **different subsets** of the original training set `x`. Specifically, for a training set size of `i`, **you should use the first `i` examples** (i.e., `x[0:i,:]` and `y[0:i]`).

\n", 644 | "You can use the `fmin_cg` function to find the `θ` parameters. Note that `lambda_` is passed as a parameter to the `learning_curve` function. After learning the `θ` parameters, you should **compute the error on the training and cross validation sets.** Recall that the **training error** for a dataset is defined as:
\n", 645 | "$$J_{train}(\\theta) = \\frac{1}{2m}\\sum_{i=1}^{m}\\left(h_\\theta(x^{(i)}) - y^{(i)}\\right)^2$$\n", 646 | "In particular, note that the **training error does not include the regularization** term. One way to compute the training error is to **use your existing cost function and set `λ` to `0`** only when using it to compute the training error and cross validation error.
\n", 647 | "When you are **computing the training set error**, make sure you compute it on the **training subset (i.e., `x[0:i,:]` and `y[0:i]`)** (instead of the entire training set). However, for the **cross validation error**, you should compute it over the **entire cross validation set**. You should store the computed errors in the vectors `error_train` and `error_val`." 648 | ] 649 | }, 650 | { 651 | "cell_type": "markdown", 652 | "metadata": {}, 653 | "source": [ 654 | "`learning_curve(x, y, xval, yval, lambda_)` **returns the train and cross validation set errors for a learning curve**.

In particular, it returns two vectors of the same length - `error_train` and `error_val`. Then, `error_train[i]` contains the training error for `i` examples (and similarly for `error_val[i]`)." 655 | ] 656 | }, 657 | { 658 | "cell_type": "code", 659 | "execution_count": 18, 660 | "metadata": {}, 661 | "outputs": [], 662 | "source": [ 663 | "error_train = np.zeros(m)\n", 664 | "error_val = np.zeros(m)\n", 665 | "\n", 666 | "lambda_ = 1" 667 | ] 668 | }, 669 | { 670 | "cell_type": "code", 671 | "execution_count": 38, 672 | "metadata": {}, 673 | "outputs": [], 674 | "source": [ 675 | "def train_val_error(x, y, xval, yval, lambda_):\n", 676 | " m,n = x.shape\n", 677 | " theta = np.ones(n) # initialize theta for each time of training with subset of training set.\n", 678 | " new_theta = fmin_cg(f=linear_reg_cost, x0=theta, fprime=linear_reg_grad, args=(x.flatten(), y, lambda_, m,n))\n", 679 | " t_error = linear_reg_cost(new_theta.flatten(), x.flatten(), y, 0, x.shape[0], x.shape[1])\n", 680 | " v_error = linear_reg_cost(new_theta.flatten(), xval.flatten(), yval, 0, xval.shape[0], xval.shape[1])\n", 681 | " return (t_error, v_error)" 682 | ] 683 | }, 684 | { 685 | "cell_type": "code", 686 | "execution_count": 39, 687 | "metadata": {}, 688 | "outputs": [], 689 | "source": [ 690 | "def learning_curve(x, y, xval, yval, lambda_):\n", 691 | " m,n = x.shape\n", 692 | " et_array = np.zeros(m)\n", 693 | " ev_array = np.zeros(m)\n", 694 | " for i in range(1,m):\n", 695 | " et_array[i] , ev_array[i] = train_val_error(x[0:i,:],y[0:i],xval,yval,lambda_)\n", 696 | " return (et_array,ev_array)" 697 | ] 698 | }, 699 | { 700 | "cell_type": "code", 701 | "execution_count": 56, 702 | "metadata": {}, 703 | "outputs": [ 704 | { 705 | "name": "stdout", 706 | "output_type": "stream", 707 | "text": [ 708 | "Warning: Desired error not necessarily achieved due to precision loss.\n", 709 | " Current function value: 0.000001\n", 710 | " Iterations: 7\n", 711 | " Function evaluations: 145\n", 712 | 
" Gradient evaluations: 133\n", 713 | "Warning: Desired error not necessarily achieved due to precision loss.\n", 714 | " Current function value: 0.000001\n", 715 | " Iterations: 11\n", 716 | " Function evaluations: 130\n", 717 | " Gradient evaluations: 118\n", 718 | "Warning: Desired error not necessarily achieved due to precision loss.\n", 719 | " Current function value: 0.821654\n", 720 | " Iterations: 12\n", 721 | " Function evaluations: 133\n", 722 | " Gradient evaluations: 118\n", 723 | "Warning: Desired error not necessarily achieved due to precision loss.\n", 724 | " Current function value: 0.947566\n", 725 | " Iterations: 12\n", 726 | " Function evaluations: 89\n", 727 | " Gradient evaluations: 76\n", 728 | "Warning: Desired error not necessarily achieved due to precision loss.\n", 729 | " Current function value: 5.480855\n", 730 | " Iterations: 10\n", 731 | " Function evaluations: 135\n", 732 | " Gradient evaluations: 123\n", 733 | "Warning: Desired error not necessarily achieved due to precision loss.\n", 734 | " Current function value: 9.721983\n", 735 | " Iterations: 15\n", 736 | " Function evaluations: 130\n", 737 | " Gradient evaluations: 118\n", 738 | "Warning: Desired error not necessarily achieved due to precision loss.\n", 739 | " Current function value: 11.724155\n", 740 | " Iterations: 13\n", 741 | " Function evaluations: 132\n", 742 | " Gradient evaluations: 118\n", 743 | "Warning: Desired error not necessarily achieved due to precision loss.\n", 744 | " Current function value: 12.115397\n", 745 | " Iterations: 8\n", 746 | " Function evaluations: 78\n", 747 | " Gradient evaluations: 67\n", 748 | "Warning: Desired error not necessarily achieved due to precision loss.\n", 749 | " Current function value: 16.957055\n", 750 | " Iterations: 14\n", 751 | " Function evaluations: 109\n", 752 | " Gradient evaluations: 94\n", 753 | "Warning: Desired error not necessarily achieved due to precision loss.\n", 754 | " Current function value: 19.384552\n", 
755 | " Iterations: 9\n", 756 | " Function evaluations: 118\n", 757 | " Gradient evaluations: 106\n", 758 | "Warning: Desired error not necessarily achieved due to precision loss.\n", 759 | " Current function value: 22.290813\n", 760 | " Iterations: 22\n", 761 | " Function evaluations: 141\n", 762 | " Gradient evaluations: 128\n" 763 | ] 764 | } 765 | ], 766 | "source": [ 767 | "error_train, error_val = learning_curve(x,y,xval,yval,lambda_,)" 768 | ] 769 | }, 770 | { 771 | "cell_type": "markdown", 772 | "metadata": {}, 773 | "source": [ 774 | "## 5.2 Plotting Learning Curve\n", 775 | "You should observe that both the **train error and cross validation error are high** when the number of **training examples** is **increased**. This reflects a **high bias** problem in the model. (the **linear regression** model is too simple and is unable to fit our dataset well so it is **underfitting**)" 776 | ] 777 | }, 778 | { 779 | "cell_type": "code", 780 | "execution_count": 74, 781 | "metadata": {}, 782 | "outputs": [ 783 | { 784 | "data": { 785 | "image/png": "\n", 786 | "text/plain": [ 787 | "
" 788 | ] 789 | }, 790 | "metadata": {}, 791 | "output_type": "display_data" 792 | } 793 | ], 794 | "source": [ 795 | "plt.plot(np.arange(2,m+1),error_train[1:], label = 'train error')\n", 796 | "plt.plot(np.arange(2,m+1),error_val[1:], label = 'cross validation error', color= 'green')\n", 797 | "plt.axis([0, 12, 0, 160])\n", 798 | "plt.title('Training Set')\n", 799 | "plt.xlabel('Number of training examples (x)')\n", 800 | "plt.ylabel('Error (y)')\n", 801 | "plt.grid()\n", 802 | "plt.legend()\n", 803 | "plt.show()" 804 | ] 805 | }, 806 | { 807 | "cell_type": "markdown", 808 | "metadata": {}, 809 | "source": [ 810 | "In the next section, you will implement **polynomial regression** to fit a better model for this dataset." 811 | ] 812 | } 813 | ], 814 | "metadata": { 815 | "kernelspec": { 816 | "display_name": "Python 3", 817 | "language": "python", 818 | "name": "python3" 819 | }, 820 | "language_info": { 821 | "codemirror_mode": { 822 | "name": "ipython", 823 | "version": 3 824 | }, 825 | "file_extension": ".py", 826 | "mimetype": "text/x-python", 827 | "name": "python", 828 | "nbconvert_exporter": "python", 829 | "pygments_lexer": "ipython3", 830 | "version": "3.6.6" 831 | } 832 | }, 833 | "nbformat": 4, 834 | "nbformat_minor": 2 835 | } 836 | -------------------------------------------------------------------------------- /Week 6 - Regularized Linear Regression and Bias v.s. 
Variance/Xtest.csv: -------------------------------------------------------------------------------- 1 | -3.331800399061839357e+01 2 | -3.791216402831621224e+01 3 | -5.120693794827316481e+01 4 | -6.132595848228624469e+00 5 | 2.126118327389842833e+01 6 | -4.031952949030852551e+01 7 | -1.454153167295283566e+01 8 | 3.255976024170858807e+01 9 | 1.339343254732885846e+01 10 | 4.420988594678166805e+01 11 | -1.142677675487955291e+00 12 | -1.276686065227885081e+01 13 | 3.405450538959663476e+01 14 | 3.922350027740379375e+01 15 | 1.974496739238940535e+00 16 | 2.962175509870446888e+01 17 | -2.366962970665967703e+01 18 | -9.011801392661441312e+00 19 | -5.594057090677502231e+01 20 | -3.570859751906493074e+01 21 | 9.510205326576553375e+00 22 | -------------------------------------------------------------------------------- /Week 6 - Regularized Linear Regression and Bias v.s. Variance/Xval.csv: -------------------------------------------------------------------------------- 1 | -1.674653577802068938e+01 2 | -1.457747074924186848e+01 3 | 3.451575865729932246e+01 4 | -4.701007574320075832e+01 5 | 3.697511904636278501e+01 6 | -4.068611001536747551e+01 7 | -4.472010975766456120e+00 8 | 2.653363489478886095e+01 9 | -4.279768310017955457e+01 10 | 2.537409938352766403e+01 11 | -3.110955397730775118e+01 12 | 2.731176863521341147e+01 13 | -3.263862013656720684e+00 14 | -1.818276487115874751e+00 15 | -4.071966240251615687e+01 16 | -5.001324364549542878e+01 17 | -1.741177154801637883e+01 18 | 3.588193696644128572e+00 19 | 7.085480261970673155e+00 20 | 4.628236901853892959e+01 21 | 1.461228909165653889e+01 22 | -------------------------------------------------------------------------------- /Week 6 - Regularized Linear Regression and Bias v.s. 
Variance/ex5data1.mat: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 6 - Regularized Linear Regression and Bias v.s. Variance/ex5data1.mat -------------------------------------------------------------------------------- /Week 6 - Regularized Linear Regression and Bias v.s. Variance/img/jtrain.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 6 - Regularized Linear Regression and Bias v.s. Variance/img/jtrain.JPG -------------------------------------------------------------------------------- /Week 6 - Regularized Linear Regression and Bias v.s. Variance/img/poly.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 6 - Regularized Linear Regression and Bias v.s. Variance/img/poly.JPG -------------------------------------------------------------------------------- /Week 6 - Regularized Linear Regression and Bias v.s. Variance/img/rlrc.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 6 - Regularized Linear Regression and Bias v.s. Variance/img/rlrc.JPG -------------------------------------------------------------------------------- /Week 6 - Regularized Linear Regression and Bias v.s. Variance/img/rlrg.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Nikronic/Coursera-Machine-Learning/4bc5de16446b664f9995eba95762b730547b1fce/Week 6 - Regularized Linear Regression and Bias v.s. 
Variance/img/rlrg.JPG -------------------------------------------------------------------------------- /Week 6 - Regularized Linear Regression and Bias v.s. Variance/ytest.csv: -------------------------------------------------------------------------------- 1 | 3.316889531756360476e+00 2 | 5.397689520216154335e+00 3 | 1.304298374520143078e-01 4 | 6.192598202383872596e+00 5 | 1.708848711547617327e+01 6 | 7.995080467101720600e-01 7 | 2.824791834378351130e+00 8 | 2.862123333554546889e+01 9 | 1.704639080632776782e+01 10 | 5.538437334220785857e+01 11 | 4.079367333128050888e+00 12 | 8.270397934583032296e+00 13 | 3.132355101950563281e+01 14 | 3.915906103292760321e+01 15 | 8.087279893552164367e+00 16 | 2.411134389353750151e+01 17 | 2.477354802758796826e+00 18 | 6.566064719303037478e+00 19 | 6.038088801572035536e+00 20 | 4.692739558592498916e+00 21 | 1.083004606320572805e+01 22 | -------------------------------------------------------------------------------- /Week 6 - Regularized Linear Regression and Bias v.s. Variance/yval.csv: -------------------------------------------------------------------------------- 1 | 4.170202008850626640e+00 2 | 4.067262803838972651e+00 3 | 3.187306757578932803e+01 4 | 1.062365618969514536e+01 5 | 3.183602128133837184e+01 6 | 4.959369720997110598e+00 7 | 4.451598803470352195e+00 8 | 2.227631845748983963e+01 9 | -4.387382739157175138e-05 10 | 2.050380157930803549e+01 11 | 3.858344762697331731e+00 12 | 1.936505291560758124e+01 13 | 4.883762805453054412e+00 14 | 1.109715884838211863e+01 15 | 7.461708266154005287e+00 16 | 1.476934642298386446e+00 17 | 2.719163877647038152e+00 18 | 1.092690065536872979e+01 19 | 8.348712346301107701e+00 20 | 5.278192797904378608e+01 21 | 1.335733960607468696e+01 22 | --------------------------------------------------------------------------------