├── .gitignore.txt ├── ChatGPT Image Mar 30, 2025, 11_17_06 AM.png ├── ChatGPT Image Small.png ├── Course Image.png ├── Homeworks ├── Logistic Regression_Homework_Public.ipynb ├── Scikit-Learn - Linear Regression Homework_Public.ipynb ├── Scikit-Learn - Logistic Regression Homework_Public.ipynb ├── Week 1.ipynb └── Week 3 - Homework 2 - Public .pdf ├── LICENSE ├── Notebooks ├── Autoencoder.ipynb ├── CNN Lab.ipynb ├── Decision Tree.ipynb ├── Feature Engineering.ipynb ├── Lab 3 - Gradient Descent.ipynb ├── Linear Regression.ipynb ├── Logistic Regression.ipynb ├── Neural Network from Scratch.ipynb ├── PyTorch_Tutorial.ipynb └── Regularization and Cross-Validation.ipynb ├── README.md ├── Reading Materials ├── Autoencoders.pdf ├── Convolutional_Neural_Networks.pdf ├── Feature Representation.pdf ├── Gradient_Descent.pdf ├── Introduction.pdf ├── Linear Classification.pdf ├── Linear Regression.pdf ├── Neural_Networks.pdf ├── Neural_Networks_Part 2.pdf └── Non-parametric methods.pdf ├── Topic 1 └── Intro_General.pdf ├── Topic 2 └── Lecture 2 - Linear Regression, Regularization and Cross-Validation.pdf ├── Topic 3 └── Lecture 3 - Gradient Descent.pdf ├── Topic 4 └── Lecture 4 - Linear Classification.pdf ├── Topic 5 ├── Addtional Material - Scikit-Learn.pdf └── Lecture 5 - Feature Engineering.pdf ├── Topic 6 └── Lecture 6 -Neural Network.pdf ├── Topic 7 └── Lecture 7 - Neural Network - AutoEncoder.pdf ├── Topic 8 └── Lecture 8 - Convolutional Neural Network.pdf ├── Topic 9 └── Lecture 9 - Non-Parametric Models.pdf └── requirements.txt /.gitignore.txt: -------------------------------------------------------------------------------- 1 | Intro_General.pptx 2 | Lecture 2 - Linear Regression, Regularization and Cross-Validation.pptx -------------------------------------------------------------------------------- /ChatGPT Image Mar 30, 2025, 11_17_06 AM.png: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/rinabuoy/Practical-Applications-in-Machine-Learning/828573933300184fc0d888b901a1a69de5658dbd/ChatGPT Image Mar 30, 2025, 11_17_06 AM.png -------------------------------------------------------------------------------- /ChatGPT Image Small.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rinabuoy/Practical-Applications-in-Machine-Learning/828573933300184fc0d888b901a1a69de5658dbd/ChatGPT Image Small.png -------------------------------------------------------------------------------- /Course Image.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rinabuoy/Practical-Applications-in-Machine-Learning/828573933300184fc0d888b901a1a69de5658dbd/Course Image.png -------------------------------------------------------------------------------- /Homeworks/Logistic Regression_Homework_Public.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "cells": [ 3 | { 4 | "cell_type": "markdown", 5 | "metadata": {}, 6 | "source": [ 7 | "## Homework 3 \n", 8 | "\n", 9 | "PAML 2024,\n", 10 | "\n", 11 | "Rina Buoy, PhD" 12 | ] 13 | }, 14 | { 15 | "cell_type": "markdown", 16 | "metadata": {}, 17 | "source": [ 18 | "YOUR FULL NAME: " 19 | ] 20 | }, 21 | { 22 | "cell_type": "code", 23 | "execution_count": null, 24 | "metadata": {}, 25 | "outputs": [], 26 | "source": [ 27 | "import numpy as np\n", 28 | "import pandas as pd\n", 29 | "import matplotlib.pyplot as plt\n", 30 | "from sklearn.model_selection import train_test_split\n", 31 | "#from sklearn.preprocessing import LabelEncoder\n", 32 | "\n", 33 | "# Logistic Regression class with Gradient Descent (same as above)\n", 34 | "class LogisticRegressionGD:\n", 35 | " def __init__(self, learning_rate=0.01, iterations=1000):\n", 36 | " self.learning_rate = learning_rate\n", 37 | " self.iterations = iterations\n", 38 | "\n", 39 | " 
def sigmoid(self, z):\n", 40 | " \"\"\"Sigmoid function to map predictions to probabilities.\"\"\"\n", 41 | " return 1 / (1 + np.exp(-z))\n", 42 | "\n", 43 | " def fit(self, X, y):\n", 44 | " \"\"\"Training the logistic regression model using gradient descent.\"\"\"\n", 45 | " self.m, self.n = X.shape\n", 46 | " self.theta = np.zeros(self.n)\n", 47 | " self.bias = 0\n", 48 | "\n", 49 | " for i in range(self.iterations):\n", 50 | " z = np.dot(X, self.theta) + self.bias\n", 51 | " y_pred = self.sigmoid(z)\n", 52 | " dw = (1 / self.m) * np.dot(X.T, (y_pred - y))\n", 53 | " db = (1 / self.m) * np.sum(y_pred - y)\n", 54 | " self.theta -= self.learning_rate * dw\n", 55 | " self.bias -= self.learning_rate * db\n", 56 | " \n", 57 | " def predict(self, X):\n", 58 | " z = np.dot(X, self.theta) + self.bias\n", 59 | " y_pred = self.sigmoid(z)\n", 60 | " return [1 if i > 0.5 else 0 for i in y_pred]\n", 61 | "\n", 62 | "\n", 63 | "\n" 64 | ] 65 | }, 66 | { 67 | "cell_type": "markdown", 68 | "metadata": {}, 69 | "source": [ 70 | "### GOAL\n", 71 | "\n", 72 | "Apply the provided logistic regression solver to a Congressional Voting Records dataset." 
73 | ] 74 | }, 75 | { 76 | "cell_type": "code", 77 | "execution_count": 3, 78 | "metadata": {}, 79 | "outputs": [], 80 | "source": [ 81 | "# Load the Congressional Voting Records dataset\n", 82 | "url = \"https://archive.ics.uci.edu/ml/machine-learning-databases/voting-records/house-votes-84.data\"\n", 83 | "columns = ['party', 'handicapped-infants', 'water-project', 'budget', 'physician-fee-freeze',\n", 84 | " 'el-salvador-aid', 'religious-groups', 'anti-satellite-ban', 'aid-to-contras',\n", 85 | " 'mx-missile', 'immigration', 'synfuels', 'education', 'superfund-sue', 'crime',\n", 86 | " 'duty-free', 'south-africa']" 87 | ] 88 | }, 89 | { 90 | "cell_type": "markdown", 91 | "metadata": {}, 92 | "source": [ 93 | "#### TASK 1:\n", 94 | "\n", 95 | "(a) Load the above dataset using Pandas, \n", 96 | "\n", 97 | "(b) Replace 'y' with 1 and 'n' with 0, \n", 98 | "\n", 99 | "(c) Handle missing data by filling it with the mode of each column\n", 100 | "\n", 101 | "\n", 102 | "\n", 103 | "\n" 104 | ] 105 | }, 106 | { 107 | "cell_type": "code", 108 | "execution_count": 2, 109 | "metadata": {}, 110 | "outputs": [], 111 | "source": [ 112 | "### YOUR CODES" 113 | ] 114 | }, 115 | { 116 | "cell_type": "markdown", 117 | "metadata": {}, 118 | "source": [ 119 | "#### TASK 2:\n", 120 | "\n", 121 | "(a) Extract the feature matrix, X, and the target vector, y\n", 122 | "\n", 123 | "(b) Split it into train and test sets using train_test_split" 124 | ] 125 | }, 126 | { 127 | "cell_type": "code", 128 | "execution_count": null, 129 | "metadata": {}, 130 | "outputs": [], 131 | "source": [ 132 | "### YOUR CODES\n", 133 | "\n" 134 | ] 135 | }, 136 | { 137 | "cell_type": "markdown", 138 | "metadata": {}, 139 | "source": [ 140 | "#### TASK 3:\n", 141 | "\n", 142 | "(a) Create and train the model on the train set \n", 143 | "\n", 144 | "(b) Compute the accuracy on the test set" 145 | ] 146 | }, 147 | { 148 | "cell_type": "code", 149 | "execution_count": null, 150 | "metadata": {}, 151 | 
"outputs": [], 152 | "source": [ 153 | "### YOUR CODES" 154 | ] 155 | } 156 | ], 157 | "metadata": { 158 | "kernelspec": { 159 | "display_name": "base", 160 | "language": "python", 161 | "name": "python3" 162 | }, 163 | "language_info": { 164 | "codemirror_mode": { 165 | "name": "ipython", 166 | "version": 3 167 | }, 168 | "file_extension": ".py", 169 | "mimetype": "text/x-python", 170 | "name": "python", 171 | "nbconvert_exporter": "python", 172 | "pygments_lexer": "ipython3", 173 | "version": "3.11.5" 174 | } 175 | }, 176 | "nbformat": 4, 177 | "nbformat_minor": 2 178 | } 179 | -------------------------------------------------------------------------------- /Homeworks/Scikit-Learn - Linear Regression Homework_Public.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "cells": [ 3 | { 4 | "cell_type": "markdown", 5 | "metadata": {}, 6 | "source": [ 7 | "## Homework 5\n", 8 | "\n", 9 | "PAML 2024,\n", 10 | "\n", 11 | "Rina Buoy, PhD" 12 | ] 13 | }, 14 | { 15 | "cell_type": "markdown", 16 | "metadata": {}, 17 | "source": [ 18 | "YOUR FULL NAME: " 19 | ] 20 | }, 21 | { 22 | "cell_type": "code", 23 | "execution_count": 13, 24 | "metadata": {}, 25 | "outputs": [], 26 | "source": [ 27 | "# Import necessary libraries\n", 28 | "from sklearn.model_selection import train_test_split\n", 29 | "from sklearn.linear_model import LinearRegression\n", 30 | "from sklearn.datasets import fetch_california_housing\n", 31 | "from sklearn.metrics import r2_score" 32 | ] 33 | }, 34 | { 35 | "cell_type": "markdown", 36 | "metadata": {}, 37 | "source": [ 38 | "### Applying Linear Regression with Scikit-Learn" 39 | ] 40 | }, 41 | { 42 | "cell_type": "markdown", 43 | "metadata": {}, 44 | "source": [ 45 | "#### Task 1: Applying Linear Regression with Scikit-Learn\n" 46 | ] 47 | }, 48 | { 49 | "cell_type": "code", 50 | "execution_count": 14, 51 | "metadata": {}, 52 | "outputs": [], 53 | "source": [ 54 | "\n", 55 | "# Load the California Housing 
dataset from Scikit-Learn dataset\n", 56 | "# Store Feature Matrix as X, and target variable as y\n" 57 | ] 58 | }, 59 | { 60 | "cell_type": "markdown", 61 | "metadata": {}, 62 | "source": [ 63 | "#### Task 2: Split X, y into train and test sets\n" 64 | ] 65 | }, 66 | { 67 | "cell_type": "code", 68 | "execution_count": 15, 69 | "metadata": {}, 70 | "outputs": [], 71 | "source": [ 72 | "\n", 73 | "# Split the dataset into training and testing sets\n" 74 | ] 75 | }, 76 | { 77 | "cell_type": "markdown", 78 | "metadata": {}, 79 | "source": [ 80 | "#### Task 3: Train a linear regression model using LinearRegression from sklearn.linear_model" 81 | ] 82 | }, 83 | { 84 | "cell_type": "code", 85 | "execution_count": 16, 86 | "metadata": {}, 87 | "outputs": [], 88 | "source": [ 89 | "\n", 90 | "\n", 91 | "# Create a linear regression model\n", 92 | "# Train the model on the training data\n" 93 | ] 94 | }, 95 | { 96 | "cell_type": "markdown", 97 | "metadata": {}, 98 | "source": [ 99 | "#### Task 4: Compute R-squared on the test set using r2_score from sklearn.metrics" 100 | ] 101 | }, 102 | { 103 | "cell_type": "code", 104 | "execution_count": 17, 105 | "metadata": {}, 106 | "outputs": [], 107 | "source": [ 108 | "# Compute the R-squared on the test set" 109 | ] 110 | }, 111 | { 112 | "cell_type": "markdown", 113 | "metadata": {}, 114 | "source": [ 115 | "#### Task 5: What can be done further to improve the R-squared?" 116 | ] 117 | }, 118 | { 119 | "cell_type": "code", 120 | "execution_count": 18, 121 | "metadata": {}, 122 | "outputs": [], 123 | "source": [ 124 | "# Frame your answer in the context of the feature engineering lecture." 
125 | ] 126 | }, 127 | { 128 | "cell_type": "code", 129 | "execution_count": null, 130 | "metadata": {}, 131 | "outputs": [], 132 | "source": [] 133 | } 134 | ], 135 | "metadata": { 136 | "kernelspec": { 137 | "display_name": "base", 138 | "language": "python", 139 | "name": "python3" 140 | }, 141 | "language_info": { 142 | "codemirror_mode": { 143 | "name": "ipython", 144 | "version": 3 145 | }, 146 | "file_extension": ".py", 147 | "mimetype": "text/x-python", 148 | "name": "python", 149 | "nbconvert_exporter": "python", 150 | "pygments_lexer": "ipython3", 151 | "version": "3.11.5" 152 | } 153 | }, 154 | "nbformat": 4, 155 | "nbformat_minor": 2 156 | } 157 | -------------------------------------------------------------------------------- /Homeworks/Scikit-Learn - Logistic Regression Homework_Public.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "cells": [ 3 | { 4 | "cell_type": "markdown", 5 | "metadata": {}, 6 | "source": [ 7 | "## Homework 4\n", 8 | "\n", 9 | "PAML 2024,\n", 10 | "\n", 11 | "Rina Buoy, PhD" 12 | ] 13 | }, 14 | { 15 | "cell_type": "markdown", 16 | "metadata": {}, 17 | "source": [ 18 | "YOUR FULL NAME: " 19 | ] 20 | }, 21 | { 22 | "cell_type": "code", 23 | "execution_count": 1, 24 | "metadata": {}, 25 | "outputs": [], 26 | "source": [ 27 | "# Import necessary libraries\n", 28 | "import numpy as np\n", 29 | "from sklearn.model_selection import train_test_split\n", 30 | "from sklearn.linear_model import LogisticRegression\n", 31 | "from sklearn import datasets\n", 32 | "from sklearn.metrics import accuracy_score" 33 | ] 34 | }, 35 | { 36 | "cell_type": "markdown", 37 | "metadata": {}, 38 | "source": [ 39 | "### Applying Logistic Regression with Scikit-Learn" 40 | ] 41 | }, 42 | { 43 | "cell_type": "markdown", 44 | "metadata": {}, 45 | "source": [ 46 | "#### Task 1: Applying Logistic Regression with Scikit-Learn\n" 47 | ] 48 | }, 49 | { 50 | "cell_type": "code", 51 | "execution_count": 2, 52 | 
"metadata": {}, 53 | "outputs": [], 54 | "source": [ 55 | "\n", 56 | "# Load the Breast Cancer dataset from Scikit-Learn dataset\n", 57 | "# Store Feature Matrix as X, and target variable as y\n" 58 | ] 59 | }, 60 | { 61 | "cell_type": "markdown", 62 | "metadata": {}, 63 | "source": [ 64 | "#### Task 2: Split X, y into train and test sets\n" 65 | ] 66 | }, 67 | { 68 | "cell_type": "code", 69 | "execution_count": 3, 70 | "metadata": {}, 71 | "outputs": [], 72 | "source": [ 73 | "\n", 74 | "# Split the dataset into training and testing sets\n" 75 | ] 76 | }, 77 | { 78 | "cell_type": "markdown", 79 | "metadata": {}, 80 | "source": [ 81 | "#### Task 3: Train a logistic regression using LogisticRegression sklearn.linear_model" 82 | ] 83 | }, 84 | { 85 | "cell_type": "code", 86 | "execution_count": 4, 87 | "metadata": {}, 88 | "outputs": [], 89 | "source": [ 90 | "\n", 91 | "\n", 92 | "# Create a logistic regression model\n", 93 | "# Train the model on the training data\n" 94 | ] 95 | }, 96 | { 97 | "cell_type": "markdown", 98 | "metadata": {}, 99 | "source": [ 100 | "#### Task 4: Compute accuracy on the test set using accuracy_score from sklearn.metrics" 101 | ] 102 | }, 103 | { 104 | "cell_type": "code", 105 | "execution_count": 5, 106 | "metadata": {}, 107 | "outputs": [], 108 | "source": [ 109 | "# Compute the accuracy on the test set" 110 | ] 111 | }, 112 | { 113 | "cell_type": "markdown", 114 | "metadata": {}, 115 | "source": [ 116 | "#### Task 5: What can be done further to improve the accuracy ?" 117 | ] 118 | }, 119 | { 120 | "cell_type": "code", 121 | "execution_count": 6, 122 | "metadata": {}, 123 | "outputs": [], 124 | "source": [ 125 | "# Frame your answer in the context of feature engineering lecture." 
126 | ] 127 | }, 128 | { 129 | "cell_type": "markdown", 130 | "metadata": {}, 131 | "source": [] 132 | } 133 | ], 134 | "metadata": { 135 | "kernelspec": { 136 | "display_name": "base", 137 | "language": "python", 138 | "name": "python3" 139 | }, 140 | "language_info": { 141 | "codemirror_mode": { 142 | "name": "ipython", 143 | "version": 3 144 | }, 145 | "file_extension": ".py", 146 | "mimetype": "text/x-python", 147 | "name": "python", 148 | "nbconvert_exporter": "python", 149 | "pygments_lexer": "ipython3", 150 | "version": "3.11.5" 151 | } 152 | }, 153 | "nbformat": 4, 154 | "nbformat_minor": 2 155 | } 156 | -------------------------------------------------------------------------------- /Homeworks/Week 1.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "cells": [ 3 | { 4 | "cell_type": "markdown", 5 | "metadata": {}, 6 | "source": [ 7 | "# Week 1: Homework" 8 | ] 9 | }, 10 | { 11 | "cell_type": "markdown", 12 | "metadata": {}, 13 | "source": [ 14 | "## Instructions for Students:\n", 15 | "\n", 16 | "Complete the code cells with the exercises indicated by comments and print out the outputs.\n" 17 | ] 18 | }, 19 | { 20 | "cell_type": "code", 21 | "execution_count": 5, 22 | "metadata": {}, 23 | "outputs": [], 24 | "source": [ 25 | "\n", 26 | "# Import the necessary libraries\n" 27 | ] 28 | }, 29 | { 30 | "cell_type": "markdown", 31 | "metadata": {}, 32 | "source": [ 33 | "### Part 1: NumPy Exercises" 34 | ] 35 | }, 36 | { 37 | "cell_type": "code", 38 | "execution_count": 6, 39 | "metadata": {}, 40 | "outputs": [ 41 | { 42 | "name": "stdout", 43 | "output_type": "stream", 44 | "text": [ 45 | "### Part 1: Linear Algebra with NumPy ###\n" 46 | ] 47 | } 48 | ], 49 | "source": [ 50 | "\n", 51 | "print(\"### Part 1: Linear Algebra with NumPy ###\")\n", 52 | "\n", 53 | "\n" 54 | ] 55 | }, 56 | { 57 | "cell_type": "code", 58 | "execution_count": 7, 59 | "metadata": {}, 60 | "outputs": [], 61 | "source": [ 62 | "\n", 63 | 
"# 1. Create a 3x3 matrix with values ranging from 1 to 9\n" 64 | ] 65 | }, 66 | { 67 | "cell_type": "code", 68 | "execution_count": 8, 69 | "metadata": {}, 70 | "outputs": [], 71 | "source": [ 72 | "# 2. Create a 3x1 vector with values ranging from 10 to 12\n", 73 | "\n" 74 | ] 75 | }, 76 | { 77 | "cell_type": "code", 78 | "execution_count": 9, 79 | "metadata": {}, 80 | "outputs": [], 81 | "source": [ 82 | "# 3. Perform matrix multiplication between the matrix and vector\n" 83 | ] 84 | }, 85 | { 86 | "cell_type": "code", 87 | "execution_count": 10, 88 | "metadata": {}, 89 | "outputs": [], 90 | "source": [ 91 | "# 4. Find the determinant of the matrix\n" 92 | ] 93 | }, 94 | { 95 | "cell_type": "code", 96 | "execution_count": 11, 97 | "metadata": {}, 98 | "outputs": [], 99 | "source": [ 100 | "# 5. Find the inverse of the matrix (if it exists)\n" 101 | ] 102 | }, 103 | { 104 | "cell_type": "markdown", 105 | "metadata": {}, 106 | "source": [ 107 | "### Part 2: Working with DataFrames and Pandas" 108 | ] 109 | }, 110 | { 111 | "cell_type": "code", 112 | "execution_count": 12, 113 | "metadata": {}, 114 | "outputs": [ 115 | { 116 | "name": "stdout", 117 | "output_type": "stream", 118 | "text": [ 119 | "\n", 120 | "### Part 2: Linear Algebra with Pandas ###\n" 121 | ] 122 | } 123 | ], 124 | "source": [ 125 | "\n", 126 | "print(\"\\n### Part 2: Linear Algebra with Pandas ###\")" 127 | ] 128 | }, 129 | { 130 | "cell_type": "code", 131 | "execution_count": 13, 132 | "metadata": {}, 133 | "outputs": [], 134 | "source": [ 135 | "# 6. Create a DataFrame from a Numpy Matrix\n" 136 | ] 137 | }, 138 | { 139 | "cell_type": "code", 140 | "execution_count": 14, 141 | "metadata": {}, 142 | "outputs": [], 143 | "source": [ 144 | "# 7. Find the row-wise and column-wise mean of the DataFrame\n" 145 | ] 146 | }, 147 | { 148 | "cell_type": "code", 149 | "execution_count": 15, 150 | "metadata": {}, 151 | "outputs": [], 152 | "source": [ 153 | "# 8. 
Convert the DataFrame back to a NumPy array\n", 154 | "\n" 155 | ] 156 | }, 157 | { 158 | "cell_type": "code", 159 | "execution_count": 16, 160 | "metadata": {}, 161 | "outputs": [], 162 | "source": [ 163 | "# 9. Find the eigenvalues and eigenvectors of a Numpy Matrix" 164 | ] 165 | } 166 | ], 167 | "metadata": { 168 | "kernelspec": { 169 | "display_name": "base", 170 | "language": "python", 171 | "name": "python3" 172 | }, 173 | "language_info": { 174 | "codemirror_mode": { 175 | "name": "ipython", 176 | "version": 3 177 | }, 178 | "file_extension": ".py", 179 | "mimetype": "text/x-python", 180 | "name": "python", 181 | "nbconvert_exporter": "python", 182 | "pygments_lexer": "ipython3", 183 | "version": "3.11.5" 184 | } 185 | }, 186 | "nbformat": 4, 187 | "nbformat_minor": 2 188 | } 189 | -------------------------------------------------------------------------------- /Homeworks/Week 3 - Homework 2 - Public .pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rinabuoy/Practical-Applications-in-Machine-Learning/828573933300184fc0d888b901a1a69de5658dbd/Homeworks/Week 3 - Homework 2 - Public .pdf -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- 1 | MIT License 2 | 3 | Copyright (c) 2024 Rina Buoy 4 | 5 | Permission is hereby granted, free of charge, to any person obtaining a copy 6 | of this software and associated documentation files (the "Software"), to deal 7 | in the Software without restriction, including without limitation the rights 8 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 9 | copies of the Software, and to permit persons to whom the Software is 10 | furnished to do so, subject to the following conditions: 11 | 12 | The above copyright notice and this permission notice shall be included in all 13 | copies or substantial portions of the 
Software. 14 | 15 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 16 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 17 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE 18 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 19 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 20 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 21 | SOFTWARE. 22 | -------------------------------------------------------------------------------- /Notebooks/Autoencoder.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "cells": [ 3 | { 4 | "cell_type": "markdown", 5 | "metadata": {}, 6 | "source": [ 7 | "## An Autoencoder From Scratch\n", 8 | "\n", 9 | "by Rina Buoy, PhD" 10 | ] 11 | }, 12 | { 13 | "cell_type": "markdown", 14 | "metadata": {}, 15 | "source": [ 16 | "1. Network Structure:\n", 17 | "\n", 18 | "The encoder layer compresses the input image (784 dimensions) into a smaller hidden latent representation (64 dimensions).\n", 19 | "The decoder reconstructs the image from this compressed representation.\n", 20 | "\n", 21 | "2. Training:\n", 22 | "\n", 23 | "The model is trained on the MNIST training set, flattened and normalized to values between 0 and 1.\n", 24 | "We use Mean Squared Error as the loss and print it after every epoch.\n", 25 | "\n", 26 | "3. Reconstruction Visualization:\n", 27 | "\n", 28 | "The plot_reconstructed_images function uses matplotlib to display the original images (top row) and their reconstructions (bottom row) for comparison.\n", 29 | "\n", 30 | "4. Running and Observing:\n", 31 | "\n", 32 | "You should see the loss decrease over epochs, and the reconstructed images should look more like the originals as training progresses." 
33 | ] 34 | }, 35 | { 36 | "cell_type": "markdown", 37 | "metadata": {}, 38 | "source": [ 39 | "#### Step 1: Set up the imports" 40 | ] 41 | }, 42 | { 43 | "cell_type": "code", 44 | "execution_count": 1, 45 | "metadata": {}, 46 | "outputs": [], 47 | "source": [ 48 | "import numpy as np\n", 49 | "import torch\n", 50 | "from torchvision import datasets, transforms\n", 51 | "import matplotlib.pyplot as plt" 52 | ] 53 | }, 54 | { 55 | "cell_type": "markdown", 56 | "metadata": {}, 57 | "source": [ 58 | "### Step 2: Helper Functions" 59 | ] 60 | }, 61 | { 62 | "cell_type": "code", 63 | "execution_count": 2, 64 | "metadata": {}, 65 | "outputs": [], 66 | "source": [ 67 | "\n", 68 | "# Define the activation functions\n", 69 | "def sigmoid(x):\n", 70 | " x= np.clip( x, -500, 500 )\n", 71 | " return 1 / (1 + np.exp(-x))\n", 72 | "\n", 73 | "def sigmoid_derivative(x):\n", 74 | " return x * (1 - x)\n", 75 | "\n", 76 | "# Mean squared error loss function\n", 77 | "def mean_squared_error(y_true, y_pred):\n", 78 | " return np.mean((y_true - y_pred) ** 2)" 79 | ] 80 | }, 81 | { 82 | "cell_type": "markdown", 83 | "metadata": {}, 84 | "source": [ 85 | "### Step 3: Define the Neural Network Structure, Training Loops, Forward, and Backward Pass\n" 86 | ] 87 | }, 88 | { 89 | "cell_type": "code", 90 | "execution_count": 3, 91 | "metadata": {}, 92 | "outputs": [], 93 | "source": [ 94 | "# Define autoencoder parameters\n", 95 | "input_size = 28 * 28 # 784 for MNIST images\n", 96 | "hidden_size = 64 # Size of hidden layer\n", 97 | "output_size = input_size\n", 98 | "\n", 99 | "# Initialize weights and biases\n", 100 | "np.random.seed(42)\n", 101 | "W1 = np.random.randn(input_size, hidden_size) * 0.01\n", 102 | "b1 = np.zeros((1, hidden_size))\n", 103 | "W2 = np.random.randn(hidden_size, output_size) * 0.01\n", 104 | "b2 = np.zeros((1, output_size))\n", 105 | "\n", 106 | "# Activation and its derivative\n", 107 | "def relu(x):\n", 108 | " return np.maximum(0, x)\n", 109 | "\n", 110 | "def 
relu_derivative(x):\n", 111 | " return np.where(x > 0, 1, 0)\n", 112 | "\n", 113 | "# Forward pass\n", 114 | "def forward(X):\n", 115 | " Z1 = np.dot(X, W1) + b1\n", 116 | " A1 = relu(Z1)\n", 117 | " Z2 = np.dot(A1, W2) + b2\n", 118 | " return Z1, A1, Z2\n", 119 | "\n", 120 | "# Loss function\n", 121 | "def mse_loss(y_true, y_pred):\n", 122 | " return np.mean((y_true - y_pred) ** 2)\n", 123 | "\n", 124 | "# Backward pass\n", 125 | "def backward(X, Z1, A1, Z2, learning_rate=0.001):\n", 126 | " global W1, b1, W2, b2\n", 127 | " m = X.shape[0]\n", 128 | "\n", 129 | " # Gradients for output layer\n", 130 | " dZ2 = (Z2 - X) / m\n", 131 | " dW2 = np.dot(A1.T, dZ2)\n", 132 | " db2 = np.sum(dZ2, axis=0, keepdims=True)\n", 133 | "\n", 134 | " # Gradients for hidden layer\n", 135 | " dA1 = np.dot(dZ2, W2.T)\n", 136 | " dZ1 = dA1 * relu_derivative(Z1)\n", 137 | " dW1 = np.dot(X.T, dZ1)\n", 138 | " db1 = np.sum(dZ1, axis=0, keepdims=True)\n", 139 | "\n", 140 | " # Update weights and biases\n", 141 | " W1 -= learning_rate * dW1\n", 142 | " b1 -= learning_rate * db1\n", 143 | " W2 -= learning_rate * dW2\n", 144 | " b2 -= learning_rate * db2" 145 | ] 146 | }, 147 | { 148 | "cell_type": "markdown", 149 | "metadata": {}, 150 | "source": [ 151 | "### Step 4: Load and Prepare the dataset" 152 | ] 153 | }, 154 | { 155 | "cell_type": "code", 156 | "execution_count": 4, 157 | "metadata": {}, 158 | "outputs": [], 159 | "source": [ 160 | "# Load MNIST data using torchvision\n", 161 | "transform = transforms.Compose([transforms.ToTensor()])\n", 162 | "train_dataset = datasets.MNIST(root='./data', train=True, download=True, transform=transform)\n", 163 | "test_dataset = datasets.MNIST(root='./data', train=False, download=True, transform=transform)\n", 164 | "\n", 165 | "# Prepare data\n", 166 | "X_train = train_dataset.data.numpy().reshape(-1, 28 * 28) / 255.0 # Normalize and flatten to 784-dimensional vectors\n", 167 | "X_test = test_dataset.data.numpy().reshape(-1, 28 * 28) / 255.0" 168 | 
] 169 | }, 170 | { 171 | "cell_type": "markdown", 172 | "metadata": {}, 173 | "source": [ 174 | "### Step 5: Model Instanciation and Training" 175 | ] 176 | }, 177 | { 178 | "cell_type": "code", 179 | "execution_count": 6, 180 | "metadata": {}, 181 | "outputs": [ 182 | { 183 | "name": "stdout", 184 | "output_type": "stream", 185 | "text": [ 186 | "Epoch 1, Loss: 0.0503\n", 187 | "Epoch 2, Loss: 0.0373\n", 188 | "Epoch 3, Loss: 0.0313\n", 189 | "Epoch 4, Loss: 0.0274\n", 190 | "Epoch 5, Loss: 0.0245\n", 191 | "Epoch 6, Loss: 0.0223\n", 192 | "Epoch 7, Loss: 0.0206\n", 193 | "Epoch 8, Loss: 0.0192\n", 194 | "Epoch 9, Loss: 0.0180\n", 195 | "Epoch 10, Loss: 0.0170\n", 196 | "Epoch 11, Loss: 0.0162\n", 197 | "Epoch 12, Loss: 0.0155\n" 198 | ] 199 | }, 200 | { 201 | "ename": "KeyboardInterrupt", 202 | "evalue": "", 203 | "output_type": "error", 204 | "traceback": [ 205 | "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m", 206 | "\u001b[1;31mKeyboardInterrupt\u001b[0m Traceback (most recent call last)", 207 | "Cell \u001b[1;32mIn[6], line 15\u001b[0m\n\u001b[0;32m 13\u001b[0m \u001b[38;5;66;03m# Calculate loss on training data\u001b[39;00m\n\u001b[0;32m 14\u001b[0m _, _, output \u001b[38;5;241m=\u001b[39m forward(X_train)\n\u001b[1;32m---> 15\u001b[0m loss \u001b[38;5;241m=\u001b[39m mse_loss(X_train, output)\n\u001b[0;32m 16\u001b[0m \u001b[38;5;28mprint\u001b[39m(\u001b[38;5;124mf\u001b[39m\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mEpoch \u001b[39m\u001b[38;5;132;01m{\u001b[39;00mepoch\u001b[38;5;250m \u001b[39m\u001b[38;5;241m+\u001b[39m\u001b[38;5;250m \u001b[39m\u001b[38;5;241m1\u001b[39m\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124m, Loss: \u001b[39m\u001b[38;5;132;01m{\u001b[39;00mloss\u001b[38;5;132;01m:\u001b[39;00m\u001b[38;5;124m.4f\u001b[39m\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124m'\u001b[39m)\n", 208 | "Cell \u001b[1;32mIn[3], line 28\u001b[0m, in \u001b[0;36mmse_loss\u001b[1;34m(y_true, 
y_pred)\u001b[0m\n\u001b[0;32m 25\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m Z1, A1, Z2\n\u001b[0;32m 27\u001b[0m \u001b[38;5;66;03m# Loss function\u001b[39;00m\n\u001b[1;32m---> 28\u001b[0m \u001b[38;5;28;01mdef\u001b[39;00m \u001b[38;5;21mmse_loss\u001b[39m(y_true, y_pred):\n\u001b[0;32m 29\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m np\u001b[38;5;241m.\u001b[39mmean((y_true \u001b[38;5;241m-\u001b[39m y_pred) \u001b[38;5;241m*\u001b[39m\u001b[38;5;241m*\u001b[39m \u001b[38;5;241m2\u001b[39m)\n\u001b[0;32m 31\u001b[0m \u001b[38;5;66;03m# Backward pass\u001b[39;00m\n", 209 | "\u001b[1;31mKeyboardInterrupt\u001b[0m: " 210 | ] 211 | } 212 | ], 213 | "source": [ 214 | "# Training the autoencoder\n", 215 | "# Training the autoencoder\n", 216 | "epochs = 20\n", 217 | "learning_rate = 0.001\n", 218 | "batch_size = 64\n", 219 | "\n", 220 | "for epoch in range(epochs):\n", 221 | " for i in range(0, X_train.shape[0], batch_size):\n", 222 | " X_batch = X_train[i:i+batch_size]\n", 223 | " Z1, A1, Z2 = forward(X_batch)\n", 224 | " backward(X_batch, Z1, A1, Z2, learning_rate)\n", 225 | " \n", 226 | " # Calculate loss on training data\n", 227 | " _, _, output = forward(X_train)\n", 228 | " loss = mse_loss(X_train, output)\n", 229 | " print(f'Epoch {epoch + 1}, Loss: {loss:.4f}')\n" 230 | ] 231 | }, 232 | { 233 | "cell_type": "markdown", 234 | "metadata": {}, 235 | "source": [ 236 | "### Step 6: Model Testing by Reconstruction" 237 | ] 238 | }, 239 | { 240 | "cell_type": "code", 241 | "execution_count": 7, 242 | "metadata": {}, 243 | "outputs": [ 244 | { 245 | "data": { 246 | "image/png": "", 247 | "text/plain": [ 248 | "
" 249 | ] 250 | }, 251 | "metadata": {}, 252 | "output_type": "display_data" 253 | } 254 | ], 255 | "source": [ 256 | "# Testing and visualizing the reconstructed images\n", 257 | "def plot_reconstructed_images(original, reconstructed, n=10):\n", 258 | " plt.figure(figsize=(20, 4))\n", 259 | " for i in range(n):\n", 260 | " # Original images\n", 261 | " ax = plt.subplot(2, n, i + 1)\n", 262 | " plt.imshow(original[i].reshape(28, 28), cmap=\"gray\")\n", 263 | " plt.axis(\"off\")\n", 264 | "\n", 265 | " # Reconstructed images\n", 266 | " ax = plt.subplot(2, n, i + 1 + n)\n", 267 | " plt.imshow(reconstructed[i].reshape(28, 28), cmap=\"gray\")\n", 268 | " plt.axis(\"off\")\n", 269 | " plt.show()\n", 270 | "\n", 271 | "# Test on x_test data\n", 272 | "_, _, x_test_reconstructed = forward(X_test)\n", 273 | "plot_reconstructed_images(X_test, x_test_reconstructed)" 274 | ] 275 | } 276 | ], 277 | "metadata": { 278 | "kernelspec": { 279 | "display_name": "base", 280 | "language": "python", 281 | "name": "python3" 282 | }, 283 | "language_info": { 284 | "codemirror_mode": { 285 | "name": "ipython", 286 | "version": 3 287 | }, 288 | "file_extension": ".py", 289 | "mimetype": "text/x-python", 290 | "name": "python", 291 | "nbconvert_exporter": "python", 292 | "pygments_lexer": "ipython3", 293 | "version": "3.11.5" 294 | } 295 | }, 296 | "nbformat": 4, 297 | "nbformat_minor": 2 298 | } 299 | -------------------------------------------------------------------------------- /Notebooks/Feature Engineering.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "cells": [ 3 | { 4 | "cell_type": "markdown", 5 | "metadata": {}, 6 | "source": [ 7 | "## Feature Engineering\n", 8 | "\n", 9 | "by Rina Buoy, PhD" 10 | ] 11 | }, 12 | { 13 | "cell_type": "markdown", 14 | "metadata": {}, 15 | "source": [ 16 | "### 1. 
Generating dummy data" 17 | ] 18 | }, 19 | { 20 | "cell_type": "code", 21 | "execution_count": 3, 22 | "metadata": {}, 23 | "outputs": [], 24 | "source": [ 25 | "# Import necessary libraries\n", 26 | "import pandas as pd\n", 27 | "import numpy as np\n", 28 | "\n", 29 | "# Sample dataset creation\n", 30 | "data = {\n", 31 | " 'age': [25, 32, 47, 51, 62],\n", 32 | " 'salary': [50000, 60000, 120000, 90000, 140000],\n", 33 | " 'gender': ['Male', 'Female', 'Female', 'Male', 'Female'],\n", 34 | " 'city': ['Osaka', 'Tokyo', 'Tokyo', 'Osaka', 'Kyoto'],\n", 35 | " 'bought_product': [1, 0, 1, 0, 1] # Target variable\n", 36 | "}\n", 37 | "\n", 38 | "\n", 39 | "# Create a DataFrame\n", 40 | "df = pd.DataFrame(data)\n" 41 | ] 42 | }, 43 | { 44 | "cell_type": "markdown", 45 | "metadata": {}, 46 | "source": [ 47 | "### 2. Feature Engineering" 48 | ] 49 | }, 50 | { 51 | "cell_type": "code", 52 | "execution_count": 4, 53 | "metadata": {}, 54 | "outputs": [], 55 | "source": [ 56 | "\n", 57 | "\n", 58 | "# Step 1: Feature Engineering - Adding new features\n", 59 | "# Add a new feature: salary per age\n", 60 | "df['salary_per_age'] = df['salary'] / df['age']\n", 61 | "\n", 62 | "# Step 2: Encoding Categorical Data\n", 63 | "# Manually encode 'gender' (Male -> 1, Female -> 0)\n", 64 | "df['gender_encoded'] = df['gender'].map({'Male': 1, 'Female': 0})\n", 65 | "\n", 66 | "# Manually encode 'city' using One-Hot Encoding\n", 67 | "df = pd.get_dummies(df, columns=['city'], drop_first=True) # Drop the first to avoid multicollinearity\n", 68 | "\n", 69 | "# Step 3: Normalization (Min-Max Scaling)\n", 70 | "def min_max_scaling(series):\n", 71 | " return (series - series.min()) / (series.max() - series.min())\n", 72 | "\n", 73 | "# Apply normalization to 'salary' and 'salary_per_age'\n", 74 | "df['salary'] = min_max_scaling(df['salary'])\n", 75 | "df['salary_per_age'] = min_max_scaling(df['salary_per_age'])\n", 76 | "\n", 77 | "# Step 4: Generating Polynomial Features\n", 78 | "def 
add_polynomial_features(df, columns, degree=2):\n", 79 | " for col in columns:\n", 80 | " for power in range(2, degree + 1):\n", 81 | " df[f'{col}_pow_{power}'] = df[col] ** power\n", 82 | " return df\n", 83 | "\n", 84 | "# Add polynomial features for 'age' and 'salary'\n", 85 | "df = add_polynomial_features(df, ['age', 'salary'], degree=2)\n", 86 | "\n", 87 | "\n" 88 | ] 89 | }, 90 | { 91 | "cell_type": "markdown", 92 | "metadata": {}, 93 | "source": [ 94 | "### 3. Final Features" 95 | ] 96 | }, 97 | { 98 | "cell_type": "code", 99 | "execution_count": 5, 100 | "metadata": {}, 101 | "outputs": [ 102 | { 103 | "name": "stdout", 104 | "output_type": "stream", 105 | "text": [ 106 | "Transformed Dataset:\n", 107 | " age salary gender bought_product salary_per_age gender_encoded \\\n", 108 | "0 25 0.000000 Male 1 0.298413 1 \n", 109 | "1 32 0.111111 Female 0 0.139881 0 \n", 110 | "2 47 0.777778 Female 1 1.000000 0 \n", 111 | "3 51 0.444444 Male 0 0.000000 1 \n", 112 | "4 62 1.000000 Female 1 0.625704 0 \n", 113 | "\n", 114 | " city_Osaka city_Tokyo age_pow_2 salary_pow_2 \n", 115 | "0 True False 625 0.000000 \n", 116 | "1 False True 1024 0.012346 \n", 117 | "2 False True 2209 0.604938 \n", 118 | "3 True False 2601 0.197531 \n", 119 | "4 False False 3844 1.000000 \n", 120 | "\n", 121 | "Features (X):\n", 122 | " age salary gender_encoded city_Osaka city_Tokyo age_pow_2 \\\n", 123 | "0 25 0.000000 1 True False 625 \n", 124 | "1 32 0.111111 0 False True 1024 \n", 125 | "2 47 0.777778 0 False True 2209 \n", 126 | "3 51 0.444444 1 True False 2601 \n", 127 | "4 62 1.000000 0 False False 3844 \n", 128 | "\n", 129 | " salary_pow_2 \n", 130 | "0 0.000000 \n", 131 | "1 0.012346 \n", 132 | "2 0.604938 \n", 133 | "3 0.197531 \n", 134 | "4 1.000000 \n", 135 | "\n", 136 | "Target (y):\n", 137 | "0 1\n", 138 | "1 0\n", 139 | "2 1\n", 140 | "3 0\n", 141 | "4 1\n", 142 | "Name: bought_product, dtype: int64\n" 143 | ] 144 | } 145 | ], 146 | "source": [ 147 | "# Final dataset after 
feature engineering, normalization, and encoding\n", 148 | "print(\"Transformed Dataset:\")\n", 149 | "print(df)\n", 150 | "\n", 151 | "# Optional: Split features (X) and target (y)\n", 152 | "X = df.drop(columns=['bought_product', 'gender', 'salary_per_age']) # Removing raw and unneeded columns\n", 153 | "y = df['bought_product']\n", 154 | "\n", 155 | "print(\"\\nFeatures (X):\")\n", 156 | "print(X)\n", 157 | "\n", 158 | "print(\"\\nTarget (y):\")\n", 159 | "print(y)" 160 | ] 161 | } 162 | ], 163 | "metadata": { 164 | "kernelspec": { 165 | "display_name": "base", 166 | "language": "python", 167 | "name": "python3" 168 | }, 169 | "language_info": { 170 | "codemirror_mode": { 171 | "name": "ipython", 172 | "version": 3 173 | }, 174 | "file_extension": ".py", 175 | "mimetype": "text/x-python", 176 | "name": "python", 177 | "nbconvert_exporter": "python", 178 | "pygments_lexer": "ipython3", 179 | "version": "3.11.5" 180 | } 181 | }, 182 | "nbformat": 4, 183 | "nbformat_minor": 2 184 | } 185 | -------------------------------------------------------------------------------- /Notebooks/Lab 3 - Gradient Descent.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "cells": [ 3 | { 4 | "cell_type": "markdown", 5 | "metadata": {}, 6 | "source": [ 7 | "Rina Buoy, PhD" 8 | ] 9 | }, 10 | { 11 | "cell_type": "markdown", 12 | "metadata": {}, 13 | "source": [ 14 | "## Generate Training Datasets" 15 | ] 16 | }, 17 | { 18 | "cell_type": "markdown", 19 | "metadata": {}, 20 | "source": [ 21 | "$y = \\theta_0 + \\theta_1 x_1 + \\epsilon$\n", 22 | "\n", 23 | "$\\theta_0 = 4$\n", 24 | "\n", 25 | "$\\theta_1 = 3$\n" 26 | ] 27 | }, 28 | { 29 | "cell_type": "code", 30 | "execution_count": 5, 31 | "metadata": {}, 32 | "outputs": [], 33 | "source": [ 34 | "import numpy as np\n", 35 | "import matplotlib.pyplot as plt\n", 36 | "\n", 37 | "# Generate some random data for demonstration\n", 38 | "np.random.seed(0)\n", 39 | "X = 2 * 
np.random.rand(100, 1) # feature x_1, uniform in [0, 2)\n", 40 | "y = 4 + 3 * X + np.random.randn(100, 1) # noisy target y (true line plus Gaussian noise epsilon)\n", 41 | "\n", 42 | "\n" 43 | ] 44 | }, 45 | { 46 | "cell_type": "code", 47 | "execution_count": null, 48 | "metadata": {}, 49 | "outputs": [], 50 | "source": [ 51 | "\n", 52 | "plt.scatter(X, y)\n", 53 | "plt.xlabel('X')\n", 54 | "plt.ylabel('y')" 55 | ] 56 | }, 57 | { 58 | "cell_type": "markdown", 59 | "metadata": {}, 60 | "source": [] 61 | }, 62 | { 63 | "cell_type": "markdown", 64 | "metadata": {}, 65 | "source": [ 66 | "## Gradient Descent" 67 | ] 68 | }, 69 | { 70 | "cell_type": "code", 71 | "execution_count": null, 72 | "metadata": {}, 73 | "outputs": [], 74 | "source": [ 75 | "# Define the learning rate and number of iterations\n", 76 | "learning_rate = 0.1\n", 77 | "n_iterations = 10\n", 78 | "\n", 79 | "# Add a column of ones to X for the bias term\n", 80 | "X_b = np.c_[np.ones((100, 1)), X]\n", 81 | "\n", 82 | "# Function to compute the loss (mean squared error)\n", 83 | "def compute_loss(theta, X, y):\n", 84 | " error = y - X.dot(theta)\n", 85 | " loss = np.mean(error**2)\n", 86 | " return loss\n", 87 | "\n", 88 | "# Function to compute the gradients\n", 89 | "def compute_gradients(theta, X, y):\n", 90 | " gradients = -2/X.shape[0] * X.T.dot(y - X.dot(theta))\n", 91 | " return gradients\n", 92 | "\n", 93 | "# Function to perform gradient descent\n", 94 | "def gradient_descent(X, y, learning_rate, n_iterations):\n", 95 | " theta = np.random.randn(2,1) # Random initialization of parameters\n", 96 | " theta_trajectory = []\n", 97 | " losses = []\n", 98 | " for iteration in range(n_iterations):\n", 99 | " gradients = compute_gradients(theta, X, y)\n", 100 | " theta = theta - learning_rate * gradients\n", 101 | " theta_trajectory.append(theta)\n", 102 | " losses.append(compute_loss(theta, X, y))\n", 103 | "\n", 104 | " plt.figure()\n", 105 | "\n", 106 | " plt.scatter(X[:,-1], y)\n", 107 | " plt.plot(X[:,-1], X.dot(theta), color='red')\n", 108 | " plt.xlabel('X')\n", 
109 | " plt.ylabel('y')\n", 110 | " plt.title(f'Gradient Descent Linear Regression : Iter {iteration}')\n", 111 | " return theta,theta_trajectory,losses\n", 112 | "\n", 113 | "# Perform gradient descent\n", 114 | "theta,theta_trajectory,losses = gradient_descent(X_b, y, learning_rate, n_iterations)\n", 115 | "\n", 116 | "# Print the parameters obtained by gradient descent\n", 117 | "print(\"Parameters obtained by gradient descent:\", theta)\n", 118 | "\n", 119 | "# Plot the data and the linear regression line\n", 120 | "\n", 121 | "#plt.show()\n" 122 | ] 123 | }, 124 | { 125 | "cell_type": "markdown", 126 | "metadata": {}, 127 | "source": [ 128 | "## Loss Surface" 129 | ] 130 | }, 131 | { 132 | "cell_type": "code", 133 | "execution_count": null, 134 | "metadata": {}, 135 | "outputs": [], 136 | "source": [ 137 | "\n", 138 | "\n", 139 | "theta0_vals = np.linspace(-10, 10, 100)\n", 140 | "theta1_vals = np.linspace(-10, 10, 100)\n", 141 | "theta0_mesh, theta1_mesh = np.meshgrid(theta0_vals, theta1_vals)\n", 142 | "loss_surface = np.zeros_like(theta0_mesh)\n", 143 | "for i in range(len(theta0_vals)):\n", 144 | " for j in range(len(theta1_vals)):\n", 145 | " theta_ij = np.array([[theta0_mesh[i,j]], [theta1_mesh[i,j]]])\n", 146 | " loss_surface[i,j] = compute_loss(theta_ij, X_b, y)\n", 147 | "\n", 148 | "fig = plt.figure()\n", 149 | "ax = fig.add_subplot(111, projection='3d')\n", 150 | "ax.plot_surface(theta0_mesh, theta1_mesh, loss_surface, cmap='viridis')\n", 151 | "ax.set_xlabel('Theta 0')\n", 152 | "ax.set_ylabel('Theta 1')\n", 153 | "ax.set_zlabel('Loss')\n", 154 | "ax.set_title('Loss Surface')\n", 155 | "plt.show()" 156 | ] 157 | }, 158 | { 159 | "cell_type": "markdown", 160 | "metadata": {}, 161 | "source": [ 162 | "## Learning Trajectory" 163 | ] 164 | }, 165 | { 166 | "cell_type": "code", 167 | "execution_count": null, 168 | "metadata": {}, 169 | "outputs": [], 170 | "source": [ 171 | "# Plot the loss surface\n", 172 | "theta0_vals = np.linspace(-10, 10, 100)\n", 
173 | "theta1_vals = np.linspace(-10, 10, 100)\n", 174 | "theta0_mesh, theta1_mesh = np.meshgrid(theta0_vals, theta1_vals)\n", 175 | "loss_surface = np.zeros_like(theta0_mesh)\n", 176 | "for i in range(len(theta0_vals)):\n", 177 | " for j in range(len(theta1_vals)):\n", 178 | " theta_ij = np.array([[theta0_mesh[i,j]], [theta1_mesh[i,j]]])\n", 179 | " loss_surface[i,j] = compute_loss(theta_ij, X_b, y)\n", 180 | "\n", 181 | "# Plot the trajectory\n", 182 | "theta_trajectory = np.array(theta_trajectory).squeeze()\n", 183 | "fig = plt.figure()\n", 184 | "ax = fig.add_subplot(111, projection='3d')\n", 185 | "ax.plot_surface(theta0_mesh, theta1_mesh, loss_surface, cmap='viridis', alpha=0.5)\n", 186 | "ax.plot(theta_trajectory[:,0], theta_trajectory[:,1], losses, color='red', marker='o')\n", 187 | "ax.set_xlabel('Theta 0')\n", 188 | "ax.set_ylabel('Theta 1')\n", 189 | "ax.set_zlabel('Loss')\n", 190 | "ax.set_title('Gradient Descent Trajectory')\n", 191 | "plt.show()" 192 | ] 193 | }, 194 | { 195 | "cell_type": "markdown", 196 | "metadata": {}, 197 | "source": [ 198 | "## Mini-Batch Training" 199 | ] 200 | }, 201 | { 202 | "cell_type": "code", 203 | "execution_count": null, 204 | "metadata": {}, 205 | "outputs": [], 206 | "source": [ 207 | "\n", 208 | "\n", 209 | "# Define the learning rate and number of iterations\n", 210 | "learning_rate = 0.1\n", 211 | "n_iterations = 2\n", 212 | "batch_size = 20 # Mini-batch size\n", 213 | "\n", 214 | "# Function to compute the loss (mean squared error)\n", 215 | "def compute_loss(theta, X, y):\n", 216 | " error = y - X.dot(theta)\n", 217 | " loss = np.mean(error**2)\n", 218 | " return loss\n", 219 | "\n", 220 | "# Function to compute the gradients using a mini-batch\n", 221 | "def compute_gradients(theta, X_batch, y_batch):\n", 222 | " gradients = -2/X_batch.shape[0] * X_batch.T.dot(y_batch - X_batch.dot(theta))\n", 223 | " return gradients\n", 224 | "\n", 225 | "# Function to perform gradient descent with mini-batch training\n", 226 
| "def gradient_descent(X, y, learning_rate, n_iterations, batch_size):\n", 227 | " theta = np.random.randn(2,1) # Random initialization of parameters\n", 228 | " theta_trajectory = [theta]\n", 229 | " loss = compute_loss(theta, X, y)\n", 230 | " losses = [loss ]\n", 231 | " m = len(X)\n", 232 | " for iteration in range(n_iterations):\n", 233 | " shuffled_indices = np.random.permutation(m)\n", 234 | " X_shuffled = X[shuffled_indices]\n", 235 | " y_shuffled = y[shuffled_indices]\n", 236 | " for i in range(0, m, batch_size):\n", 237 | " X_batch = X_shuffled[i:i+batch_size]\n", 238 | " y_batch = y_shuffled[i:i+batch_size]\n", 239 | " gradients = compute_gradients(theta, X_batch, y_batch)\n", 240 | " theta = theta - learning_rate * gradients\n", 241 | " loss = compute_loss(theta, X, y)\n", 242 | " theta_trajectory.append(theta)\n", 243 | " losses.append(loss)\n", 244 | " plt.figure()\n", 245 | "\n", 246 | " plt.scatter(X[:,-1], y)\n", 247 | " plt.plot(X[:,-1], X.dot(theta), color='red')\n", 248 | " plt.xlabel('X')\n", 249 | " plt.ylabel('y')\n", 250 | " plt.title(f'Gradient Descent Linear Regression : Iteration {iteration} Batch {i}')\n", 251 | " \n", 252 | " return theta_trajectory, losses\n", 253 | "\n", 254 | "# Perform gradient descent with mini-batch training\n", 255 | "theta_trajectory,losses = gradient_descent(X_b, y, learning_rate, n_iterations, batch_size)\n", 256 | "\n", 257 | "\n" 258 | ] 259 | }, 260 | { 261 | "cell_type": "code", 262 | "execution_count": null, 263 | "metadata": {}, 264 | "outputs": [], 265 | "source": [ 266 | "# Plot the loss surface\n", 267 | "theta0_vals = np.linspace(-10, 10, 100)\n", 268 | "theta1_vals = np.linspace(-10, 10, 100)\n", 269 | "theta0_mesh, theta1_mesh = np.meshgrid(theta0_vals, theta1_vals)\n", 270 | "loss_surface = np.zeros_like(theta0_mesh)\n", 271 | "for i in range(len(theta0_vals)):\n", 272 | " for j in range(len(theta1_vals)):\n", 273 | " theta_ij = np.array([[theta0_mesh[i,j]], [theta1_mesh[i,j]]])\n", 274 | " 
loss_surface[i,j] = compute_loss(theta_ij, X_b, y)\n", 275 | "\n", 276 | "# Plot the trajectory\n", 277 | "theta_trajectory = np.array(theta_trajectory).squeeze()\n", 278 | "fig = plt.figure()\n", 279 | "ax = fig.add_subplot(111, projection='3d')\n", 280 | "ax.plot_surface(theta0_mesh, theta1_mesh, loss_surface, cmap='viridis', alpha=0.5)\n", 281 | "ax.plot(theta_trajectory[:,0], theta_trajectory[:,1], losses, color='red', marker='o')\n", 282 | "ax.set_xlabel('Theta 0')\n", 283 | "ax.set_ylabel('Theta 1')\n", 284 | "ax.set_zlabel('Loss')\n", 285 | "ax.set_title('Gradient Descent Trajectory with Mini-Batch Training')\n", 286 | "plt.show()" 287 | ] 288 | } 289 | ], 290 | "metadata": { 291 | "kernelspec": { 292 | "display_name": "base", 293 | "language": "python", 294 | "name": "python3" 295 | }, 296 | "language_info": { 297 | "codemirror_mode": { 298 | "name": "ipython", 299 | "version": 3 300 | }, 301 | "file_extension": ".py", 302 | "mimetype": "text/x-python", 303 | "name": "python", 304 | "nbconvert_exporter": "python", 305 | "pygments_lexer": "ipython3", 306 | "version": "3.11.5" 307 | } 308 | }, 309 | "nbformat": 4, 310 | "nbformat_minor": 2 311 | } 312 | -------------------------------------------------------------------------------- /Notebooks/Neural Network from Scratch.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "cells": [ 3 | { 4 | "cell_type": "markdown", 5 | "metadata": {}, 6 | "source": [ 7 | "## Neural Network From Scratch\n", 8 | "\n", 9 | "by Rina Buoy, PhD" 10 | ] 11 | }, 12 | { 13 | "cell_type": "markdown", 14 | "metadata": {}, 15 | "source": [ 16 | "This simple neural network model demonstrates:\n", 17 | "\n", 18 | "1. Network design with one hidden layer.\n", 19 | "\n", 20 | "2. Forward propagation to compute activations.\n", 21 | "\n", 22 | "3. Binary cross-entropy loss computation.\n", 23 | "\n", 24 | "4. Backward propagation for gradient computation.\n", 25 | "\n", 26 | "5. 
Parameter updates using gradient descent.\n", 27 | "\n", 28 | "This setup can classify points into two classes based on the relationship between X[:, 0] and X[:, 1]. Adjusting the number of nodes, layers, or epochs can improve accuracy." 29 | ] 30 | }, 31 | { 32 | "cell_type": "markdown", 33 | "metadata": {}, 34 | "source": [ 35 | "#### Step 1: Set up the imports" 36 | ] 37 | }, 38 | { 39 | "cell_type": "code", 40 | "execution_count": 2, 41 | "metadata": {}, 42 | "outputs": [], 43 | "source": [ 44 | "import numpy as np\n", 45 | "import matplotlib.pyplot as plt" 46 | ] 47 | }, 48 | { 49 | "cell_type": "markdown", 50 | "metadata": {}, 51 | "source": [ 52 | "### Step 2: Generate Sample Data" 53 | ] 54 | }, 55 | { 56 | "cell_type": "code", 57 | "execution_count": 3, 58 | "metadata": {}, 59 | "outputs": [], 60 | "source": [ 61 | "np.random.seed(42) # For reproducibility\n", 62 | "\n", 63 | "# Generate 100 random points for two classes\n", 64 | "X = np.random.randn(100, 2)\n", 65 | "y = (X[:, 0] * X[:, 1] > 0).astype(int) # Points where x*y > 0 are in class 1\n", 66 | "y = y.reshape(-1, 1)" 67 | ] 68 | }, 69 | { 70 | "cell_type": "code", 71 | "execution_count": 4, 72 | "metadata": {}, 73 | "outputs": [ 74 | { 75 | "data": { 76 | "text/plain": [ 77 | "Text(0.5, 1.0, 'A binary classification with 2 features')" 78 | ] 79 | }, 80 | "execution_count": 4, 81 | "metadata": {}, 82 | "output_type": "execute_result" 83 | }, 84 | { 85 | "data": { 86 | "image/png": "", 87 | "text/plain": [ 88 | "
" 89 | ] 90 | }, 91 | "metadata": {}, 92 | "output_type": "display_data" 93 | } 94 | ], 95 | "source": [ 96 | "import matplotlib.pyplot as plt\n", 97 | "\n", 98 | "plt.scatter(X[:,0],X[:,1], c=y)\n", 99 | "plt.xlabel('X1')\n", 100 | "plt.ylabel('X2')\n", 101 | "plt.title('A binary classification with 2 features')\n", 102 | "\n" 103 | ] 104 | }, 105 | { 106 | "cell_type": "markdown", 107 | "metadata": {}, 108 | "source": [ 109 | "### Step 3: Define the Neural Network Structure\n", 110 | "\n", 111 | "We’ll use a neural network with:\n", 112 | "\n", 113 | "Input layer of 2 nodes (for 2 features),\n", 114 | "1 hidden layer with 4 nodes,\n", 115 | "Output layer with 1 node (for binary classification)." 116 | ] 117 | }, 118 | { 119 | "cell_type": "code", 120 | "execution_count": 5, 121 | "metadata": {}, 122 | "outputs": [], 123 | "source": [ 124 | "# Define network dimensions\n", 125 | "input_dim = 2\n", 126 | "hidden_dim = 4\n", 127 | "output_dim = 1\n", 128 | "\n", 129 | "# Initialize weights and biases with small random values\n", 130 | "W1 = np.random.randn(input_dim, hidden_dim) * 0.01\n", 131 | "b1 = np.zeros((1, hidden_dim))\n", 132 | "W2 = np.random.randn(hidden_dim, output_dim) * 0.01\n", 133 | "b2 = np.zeros((1, output_dim))\n" 134 | ] 135 | }, 136 | { 137 | "cell_type": "markdown", 138 | "metadata": {}, 139 | "source": [ 140 | "#### Step 4: Define Activation and Loss Functions\n", 141 | "\n", 142 | "We’ll use the ReLU activation for the hidden layer and sigmoid for the output layer." 
143 | ] 144 | }, 145 | { 146 | "cell_type": "code", 147 | "execution_count": 6, 148 | "metadata": {}, 149 | "outputs": [], 150 | "source": [ 151 | "def sigmoid(x):\n", 152 | " return 1 / (1 + np.exp(-x))\n", 153 | "\n", 154 | "def sigmoid_derivative(x):\n", 155 | " return sigmoid(x) * (1 - sigmoid(x))\n", 156 | "\n", 157 | "def relu(x):\n", 158 | " return np.maximum(0, x)\n", 159 | "\n", 160 | "def relu_derivative(x):\n", 161 | " return (x > 0).astype(float)\n", 162 | "\n", 163 | "def binary_cross_entropy(predictions, targets):\n", 164 | " # Binary cross-entropy loss\n", 165 | " m = targets.shape[0]\n", 166 | " return -np.mean(targets * np.log(predictions + 1e-9) + (1 - targets) * np.log(1 - predictions + 1e-9))\n" 167 | ] 168 | }, 169 | { 170 | "cell_type": "markdown", 171 | "metadata": {}, 172 | "source": [ 173 | "#### Step 5: Forward Propagation\n", 174 | "\n", 175 | "Compute the activations for each layer in the network." 176 | ] 177 | }, 178 | { 179 | "cell_type": "code", 180 | "execution_count": 7, 181 | "metadata": {}, 182 | "outputs": [], 183 | "source": [ 184 | "def forward_propagation(X):\n", 185 | " # Hidden layer\n", 186 | " Z1 = np.dot(X, W1) + b1\n", 187 | " A1 = relu(Z1)\n", 188 | " \n", 189 | " # Output layer\n", 190 | " Z2 = np.dot(A1, W2) + b2\n", 191 | " A2 = sigmoid(Z2)\n", 192 | " \n", 193 | " return Z1, A1, Z2, A2\n" 194 | ] 195 | }, 196 | { 197 | "cell_type": "markdown", 198 | "metadata": {}, 199 | "source": [ 200 | "#### Step 6: Backward Propagation\n", 201 | "Compute gradients of weights and biases." 
202 | ] 203 | }, 204 | { 205 | "cell_type": "code", 206 | "execution_count": 8, 207 | "metadata": {}, 208 | "outputs": [], 209 | "source": [ 210 | "def backward_propagation(X, y, Z1, A1, Z2, A2):\n", 211 | " m = X.shape[0]\n", 212 | " \n", 213 | " # Output layer gradients\n", 214 | " dZ2 = A2 - y\n", 215 | " dW2 = (1 / m) * np.dot(A1.T, dZ2)\n", 216 | " db2 = (1 / m) * np.sum(dZ2, axis=0, keepdims=True)\n", 217 | " \n", 218 | " # Hidden layer gradients\n", 219 | " dA1 = np.dot(dZ2, W2.T)\n", 220 | " dZ1 = dA1 * relu_derivative(Z1)\n", 221 | " dW1 = (1 / m) * np.dot(X.T, dZ1)\n", 222 | " db1 = (1 / m) * np.sum(dZ1, axis=0, keepdims=True)\n", 223 | " \n", 224 | " return dW1, db1, dW2, db2\n" 225 | ] 226 | }, 227 | { 228 | "cell_type": "markdown", 229 | "metadata": {}, 230 | "source": [ 231 | "#### Step 7: Gradient Descent Update" 232 | ] 233 | }, 234 | { 235 | "cell_type": "code", 236 | "execution_count": 9, 237 | "metadata": {}, 238 | "outputs": [], 239 | "source": [ 240 | "learning_rate = 0.1\n", 241 | "\n", 242 | "def update_parameters(W1, b1, W2, b2, dW1, db1, dW2, db2, learning_rate):\n", 243 | " W1 -= learning_rate * dW1\n", 244 | " b1 -= learning_rate * db1\n", 245 | " W2 -= learning_rate * dW2\n", 246 | " b2 -= learning_rate * db2\n", 247 | " return W1, b1, W2, b2\n" 248 | ] 249 | }, 250 | { 251 | "cell_type": "markdown", 252 | "metadata": {}, 253 | "source": [ 254 | "#### Step 8: Training Loop\n", 255 | "\n", 256 | "Now we’ll combine everything and run a training loop for several epochs." 
257 | ] 258 | }, 259 | { 260 | "cell_type": "code", 261 | "execution_count": 10, 262 | "metadata": {}, 263 | "outputs": [ 264 | { 265 | "name": "stdout", 266 | "output_type": "stream", 267 | "text": [ 268 | "Epoch 0, Loss: 0.6932\n", 269 | "Epoch 100, Loss: 0.6922\n", 270 | "Epoch 200, Loss: 0.6912\n", 271 | "Epoch 300, Loss: 0.6854\n", 272 | "Epoch 400, Loss: 0.6610\n", 273 | "Epoch 500, Loss: 0.6253\n", 274 | "Epoch 600, Loss: 0.5914\n", 275 | "Epoch 700, Loss: 0.5485\n", 276 | "Epoch 800, Loss: 0.5043\n", 277 | "Epoch 900, Loss: 0.4531\n" 278 | ] 279 | } 280 | ], 281 | "source": [ 282 | "epochs = 1000\n", 283 | "\n", 284 | "for epoch in range(epochs):\n", 285 | " # Forward propagation\n", 286 | " Z1, A1, Z2, A2 = forward_propagation(X)\n", 287 | " \n", 288 | " # Compute loss\n", 289 | " loss = binary_cross_entropy(A2, y)\n", 290 | " \n", 291 | " # Backward propagation\n", 292 | " dW1, db1, dW2, db2 = backward_propagation(X, y, Z1, A1, Z2, A2)\n", 293 | " \n", 294 | " # Update parameters\n", 295 | " W1, b1, W2, b2 = update_parameters(W1, b1, W2, b2, dW1, db1, dW2, db2, learning_rate)\n", 296 | " \n", 297 | " # Print loss every 100 epochs\n", 298 | " if epoch % 100 == 0:\n", 299 | " print(f\"Epoch {epoch}, Loss: {loss:.4f}\")\n" 300 | ] 301 | }, 302 | { 303 | "cell_type": "markdown", 304 | "metadata": {}, 305 | "source": [ 306 | "#### Step 9: Testing the Model\n", 307 | "\n", 308 | "After training, let’s test the model's accuracy." 
309 | ] 310 | }, 311 | { 312 | "cell_type": "code", 313 | "execution_count": 11, 314 | "metadata": {}, 315 | "outputs": [ 316 | { 317 | "name": "stdout", 318 | "output_type": "stream", 319 | "text": [ 320 | "Training Accuracy: 84.00%\n" 321 | ] 322 | } 323 | ], 324 | "source": [ 325 | "def predict(X):\n", 326 | " _, _, _, A2 = forward_propagation(X)\n", 327 | " return (A2 > 0.5).astype(int)\n", 328 | "\n", 329 | "# Test accuracy on training data\n", 330 | "predictions = predict(X)\n", 331 | "accuracy = np.mean(predictions == y) * 100\n", 332 | "print(f\"Training Accuracy: {accuracy:.2f}%\")\n" 333 | ] 334 | }, 335 | { 336 | "cell_type": "markdown", 337 | "metadata": {}, 338 | "source": [ 339 | "#### Additional: Model Parameter Count and FLOPs\n", 340 | "\n", 341 | "1. Parameter Count: The total number of parameters in a neural network is the sum of the number of weights and biases for each layer.\n", 342 | "\n", 343 | "2. FLOP Count: The FLOPs for a fully connected layer are calculated based on the number of multiplications and additions. 
Each weight requires a multiplication with an input and an addition to the output for each neuron in the layer.\n", 344 | "\n" 345 | ] 346 | }, 347 | { 348 | "cell_type": "code", 349 | "execution_count": 12, 350 | "metadata": {}, 351 | "outputs": [ 352 | { 353 | "name": "stdout", 354 | "output_type": "stream", 355 | "text": [ 356 | "Total Parameters: 17\n", 357 | "Total FLOPs per forward pass: 32\n" 358 | ] 359 | } 360 | ], 361 | "source": [ 362 | "def count_parameters():\n", 363 | " total_params = 0\n", 364 | " total_params += W1.size + b1.size # Parameters for first layer\n", 365 | " total_params += W2.size + b2.size # Parameters for second layer\n", 366 | " return total_params\n", 367 | "\n", 368 | "def count_flops(X):\n", 369 | " # FLOPs for fully connected layers = 2 * (input_size * output_size)\n", 370 | " # This accounts for multiplications and additions\n", 371 | " \n", 372 | " flops = 0\n", 373 | " \n", 374 | " # FLOPs for first layer\n", 375 | " input_size = X.shape[1]\n", 376 | " hidden_size = W1.shape[1]\n", 377 | " flops += 2 * input_size * hidden_size # Multiplications and additions\n", 378 | " \n", 379 | " # FLOPs for ReLU activations (just comparisons, typically count as 1 FLOP each)\n", 380 | " flops += hidden_size\n", 381 | " \n", 382 | " # FLOPs for second layer\n", 383 | " flops += 2 * hidden_size * W2.shape[1]\n", 384 | " \n", 385 | " # FLOPs for sigmoid activation in output layer\n", 386 | " flops += W2.shape[1] * 4 # Sigmoid (multiplications, divisions, exponentiation)\n", 387 | " \n", 388 | " return flops\n", 389 | "\n", 390 | "# Example usage:\n", 391 | "print(f\"Total Parameters: {count_parameters()}\")\n", 392 | "print(f\"Total FLOPs per forward pass: {count_flops(X)}\")\n" 393 | ] 394 | }, 395 | { 396 | "cell_type": "markdown", 397 | "metadata": {}, 398 | "source": [ 399 | "Generally, the FLOPs for backpropagation are about twice as much as the forward pass because:\n", 400 | "\n", 401 | "Gradient Computation: The gradients for weights, 
biases, and activations require both multiplications and additions similar to the forward pass.\n", 402 | "Chain Rule Application: Additional operations are needed to propagate the error backward.\n", 403 | "Here’s an approximate breakdown of the FLOPs required for each layer in the backward pass:\n", 404 | "\n", 405 | "1. Output Layer:\n", 406 | "\n", 407 | "Gradient of Loss w.r.t Output: Similar to forward pass FLOPs.\n", 408 | "Gradient w.r.t Weights and Biases: Roughly equivalent to forward pass for each parameter.\n", 409 | "Propagation of Error to Previous Layer: Similar in complexity to forward pass.\n", 410 | "\n", 411 | "2. Hidden Layer:\n", 412 | "\n", 413 | "Gradient w.r.t Activations: Similar to the forward pass, plus the application of the derivative of the activation function (e.g., ReLU or sigmoid).\n", 414 | "Gradient w.r.t Weights and Biases: Similar to forward pass.\n", 415 | "Propagation of Error: Similar to forward pass.\n", 416 | "Using these principles, here’s an approximate calculation of FLOPs for the backward pass:" 417 | ] 418 | }, 419 | { 420 | "cell_type": "code", 421 | "execution_count": 13, 422 | "metadata": {}, 423 | "outputs": [ 424 | { 425 | "name": "stdout", 426 | "output_type": "stream", 427 | "text": [ 428 | "Total FLOPs for backward pass: 53\n" 429 | ] 430 | } 431 | ], 432 | "source": [ 433 | "def count_backward_flops(X):\n", 434 | " # Backward FLOPs calculation for each layer\n", 435 | " flops = 0\n", 436 | "\n", 437 | " # Output layer FLOPs\n", 438 | " hidden_size = W1.shape[1]\n", 439 | " output_size = W2.shape[1]\n", 440 | " \n", 441 | " # Gradient of loss with respect to A2\n", 442 | " flops += output_size # For binary cross-entropy loss\n", 443 | "\n", 444 | " # Gradient of output layer weights and biases\n", 445 | " flops += 2 * hidden_size * output_size # Gradient of W2 and bias (multiplies and additions)\n", 446 | "\n", 447 | " # Propagating gradient back to hidden layer (similar to forward pass)\n", 448 | " flops += 2 
* hidden_size * output_size\n", 449 | "\n", 450 | " # Hidden layer FLOPs\n", 451 | " input_size = X.shape[1]\n", 452 | " \n", 453 | " # Gradient with respect to A1, involving the derivative of ReLU\n", 454 | " flops += hidden_size # ReLU derivatives (1 comparison per neuron)\n", 455 | "\n", 456 | " # Gradient of hidden layer weights and biases\n", 457 | " flops += 2 * input_size * hidden_size # Gradient of W1 and bias (multiplies and additions)\n", 458 | " \n", 459 | " # Propagation of gradient back to input layer\n", 460 | " flops += 2 * input_size * hidden_size\n", 461 | "\n", 462 | " return flops\n", 463 | "\n", 464 | "# Example usage:\n", 465 | "print(f\"Total FLOPs for backward pass: {count_backward_flops(X)}\")\n" 466 | ] 467 | }, 468 | { 469 | "cell_type": "markdown", 470 | "metadata": {}, 471 | "source": [ 472 | "#### Next ?\n", 473 | "\n", 474 | "What if we add additional hidden layers ?\n", 475 | "\n", 476 | "What if we use different activation function ?\n", 477 | "\n", 478 | "What if we use a linear regression loss ?" 
479 | ] 480 | } 481 | ], 482 | "metadata": { 483 | "kernelspec": { 484 | "display_name": "base", 485 | "language": "python", 486 | "name": "python3" 487 | }, 488 | "language_info": { 489 | "codemirror_mode": { 490 | "name": "ipython", 491 | "version": 3 492 | }, 493 | "file_extension": ".py", 494 | "mimetype": "text/x-python", 495 | "name": "python", 496 | "nbconvert_exporter": "python", 497 | "pygments_lexer": "ipython3", 498 | "version": "3.11.5" 499 | } 500 | }, 501 | "nbformat": 4, 502 | "nbformat_minor": 2 503 | } 504 | -------------------------------------------------------------------------------- /Notebooks/Regularization and Cross-Validation.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "cells": [ 3 | { 4 | "cell_type": "code", 5 | "execution_count": null, 6 | "metadata": {}, 7 | "outputs": [], 8 | "source": [] 9 | }, 10 | { 11 | "cell_type": "markdown", 12 | "metadata": {}, 13 | "source": [ 14 | "# Linear Regression with Cross-Validation and Regularization\n", 15 | "\n", 16 | "In this demo, we will explore two important concepts in machine learning: **Cross-Validation** and **Regularization**. We will use the `scikit-learn` package to perform these tasks.\n", 17 | "\n", 18 | "### Cross-Validation:\n", 19 | "Cross-validation is a technique for evaluating machine learning models by splitting the dataset into training and test sets multiple times to ensure that the model's performance generalizes well to unseen data. One common approach is **k-fold cross-validation**, where the data is split into `k` subsets, and the model is trained on `k-1` subsets while the remaining subset is used for validation. This process is repeated `k` times, and the average performance is taken.\n", 20 | "\n", 21 | "### Regularization:\n", 22 | "Regularization techniques add a penalty to the cost function of a machine learning model to prevent overfitting. 
We focus on two types of regularization:\n", 23 | "- **Ridge Regression (L2 Regularization)**: Adds a penalty proportional to the square of the coefficients.\n", 24 | " \n", 25 | " $\n", 26 | " J(\\theta) = \\frac{1}{2m} \\sum_{i=1}^{m} \\left( \\hat{y}^{(i)} - y^{(i)} \\right)^2 + \\lambda \\sum_{j=1}^{n} \\theta_j^2\n", 27 | "$\n", 28 | "\n", 29 | "- **Lasso Regression (L1 Regularization)**: Adds a penalty proportional to the absolute value of the coefficients.\n", 30 | "\n", 31 | " $\n", 32 | " J(\\theta) = \\frac{1}{2m} \\sum_{i=1}^{m} \\left( \\hat{y}^{(i)} - y^{(i)} \\right)^2 + \\lambda \\sum_{j=1}^{n} |\\theta_j|\n", 33 | " $\n", 34 | "\n", 35 | "The parameter $\\lambda$ (also known as `alpha` in `scikit-learn`) controls the strength of regularization: higher values increase the penalty and thus shrink the model coefficients.\n" 36 | ] 37 | }, 38 | { 39 | "cell_type": "code", 40 | "execution_count": 1, 41 | "metadata": {}, 42 | "outputs": [ 43 | { 44 | "name": "stdout", 45 | "output_type": "stream", 46 | "text": [ 47 | "Linear Regression (no regularization) 5-fold cross-validation R^2 scores: [1. 1. 1. 1. 1.]\n", 48 | "Average R^2: 1.0\n", 49 | "\n", 50 | "Ridge Regression (L2) 5-fold cross-validation R^2 scores: [0.99840327 0.9979706 0.99798774 0.99762316 0.99803145]\n", 51 | "Average R^2: 0.9980032443503974\n", 52 | "\n", 53 | "Lasso Regression (L1) 5-fold cross-validation R^2 scores: [0.99212177 0.98990394 0.98996858 0.9882734 0.99021121]\n", 54 | "Average R^2: 0.9900957787734809\n" 55 | ] 56 | }, 57 | { 58 | "data": { 59 | "text/html": [ 60 | "
LinearRegression()
In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
On GitHub, the HTML representation is unable to render, please try loading this page with nbviewer.org.
" 465 | ], 466 | "text/plain": [ 467 | "LinearRegression()" 468 | ] 469 | }, 470 | "execution_count": 1, 471 | "metadata": {}, 472 | "output_type": "execute_result" 473 | } 474 | ], 475 | "source": [ 476 | "import numpy as np\n", 477 | "import matplotlib.pyplot as plt\n", 478 | "from sklearn.linear_model import LinearRegression, Ridge, Lasso\n", 479 | "from sklearn.model_selection import cross_val_score, train_test_split\n", 480 | "\n", 481 | "# Generate synthetic data for the demo\n", 482 | "np.random.seed(0)\n", 483 | "X = 2 * np.random.rand(100, 1)\n", 484 | "y = 4 + 3 * X + np.random.randn(100, 1).ravel()\n", 485 | "\n", 486 | "# Split the data into training and testing sets\n", 487 | "X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)\n", 488 | "\n", 489 | "# Cross-validation with a simple Linear Regression (no regularization)\n", 490 | "lin_reg = LinearRegression()\n", 491 | "\n", 492 | "# Perform 5-fold cross-validation and compute the average R^2 score\n", 493 | "scores = cross_val_score(lin_reg, X_train, y_train, cv=5, scoring='r2')\n", 494 | "print(f\"Linear Regression (no regularization) 5-fold cross-validation R^2 scores: {scores}\")\n", 495 | "print(f\"Average R^2: {scores.mean()}\")\n", 496 | "\n", 497 | "# Ridge Regression (L2 Regularization)\n", 498 | "ridge_reg = Ridge(alpha=1.0) # alpha is the regularization strength\n", 499 | "\n", 500 | "# Perform cross-validation for Ridge\n", 501 | "ridge_scores = cross_val_score(ridge_reg, X_train, y_train, cv=5, scoring='r2')\n", 502 | "print(f\"\\nRidge Regression (L2) 5-fold cross-validation R^2 scores: {ridge_scores}\")\n", 503 | "print(f\"Average R^2: {ridge_scores.mean()}\")\n", 504 | "\n", 505 | "# Lasso Regression (L1 Regularization)\n", 506 | "lasso_reg = Lasso(alpha=0.1) # alpha is the regularization strength\n", 507 | "\n", 508 | "# Perform cross-validation for Lasso\n", 509 | "lasso_scores = cross_val_score(lasso_reg, X_train, y_train, cv=5, scoring='r2')\n", 
510 | "print(f\"\\nLasso Regression (L1) 5-fold cross-validation R^2 scores: {lasso_scores}\")\n", 511 | "print(f\"Average R^2: {lasso_scores.mean()}\")\n", 512 | "\n", 513 | "# Train and compare models on the test set\n", 514 | "lin_reg\n" 515 | ] 516 | } 517 | ], 518 | "metadata": { 519 | "kernelspec": { 520 | "display_name": "base", 521 | "language": "python", 522 | "name": "python3" 523 | }, 524 | "language_info": { 525 | "codemirror_mode": { 526 | "name": "ipython", 527 | "version": 3 528 | }, 529 | "file_extension": ".py", 530 | "mimetype": "text/x-python", 531 | "name": "python", 532 | "nbconvert_exporter": "python", 533 | "pygments_lexer": "ipython3", 534 | "version": "3.11.5" 535 | } 536 | }, 537 | "nbformat": 4, 538 | "nbformat_minor": 2 539 | } 540 | -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- 1 | ![Course Image](https://raw.githubusercontent.com/rinabuoy/Practical-Applications-in-Machine-Learning/main/Course%20Image.png) 2 | 3 | 4 | # Practical Applications in Machine Learning 5 | This is a repository for PAML students at the Royal University of Phnom Penh (2024). The materials for this course are adapted from https://introml.mit.edu/. The contents are solely for educational purposes. 6 | 7 | (The contents below will be updated from time to time.) 8 | 9 | 10 | # Practical Applications in Machine Learning (PAML 2024) 11 | 12 | Welcome to **PAML 2024**! This course covers the foundations and practical applications of machine learning for undergraduate students. Below is the weekly breakdown of the course content, assignments, and key deliverables. 
13 | 14 | ## Table of Contents 15 | 16 | | **Week** | **Topic** | **Description** | **Readings/Resources** | **Labs** | **Assignments** | 17 | |----------|------------|-----------------|-----------------------|-----------------|-----------------| 18 | | Topic 1 | Overview of ML | [Slide](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Topic%201/Intro_General.pdf) | [Link to Readings/Resources](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Reading%20Materials/Introduction.pdf)| [Python](https://faculty.washington.edu/otoomet/machinelearning-py/python.html); [Numpy & Pandas](https://faculty.washington.edu/otoomet/machinelearning-py/numpy-and-pandas.html); [Linear Algebra](https://faculty.washington.edu/otoomet/machinelearning-py/la.html) | [Week 1: Homework](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Homeworks/Week%201.ipynb) (Deadline: 30th Sept. 2024)| 19 | | Topic 2 | Linear Regression | [Slide](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Topic%202/Lecture%202%20-%20Linear%20Regression%2C%20Regularization%20and%20Cross-Validation.pdf) | [Link to Readings/Resources](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Reading%20Materials/Linear%20Regression.pdf)| [Linear Regression](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Notebooks/Linear%20Regression.ipynb);[Regularization](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Notebooks/Regularization%20and%20Cross-Validation.ipynb) | Assignment 1 (Kaggle Competition)| 20 | | Topic 3 | Gradient Descent | [Slide](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Topic%203/Lecture%203%20-%20Gradient%20Descent.pdf) |[Link to 
Readings/Resources](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Reading%20Materials/Gradient_Descent.pdf)| [Gradient Descent Lab](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Notebooks/Lab%203%20-%20Gradient%20Descent.ipynb) | [Homework 2](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Homeworks/Week%203%20-%20Homework%202%20-%20Public%20.pdf)| 21 | | Topic 4 | Linear Classification | [Slide](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Topic%204/Lecture%204%20-%20Linear%20Classification.pdf) |[Link to Readings/Resources](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Reading%20Materials/Linear%20Classification.pdf)| [Linear Classification Lab](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Notebooks/Logistic%20Regression.ipynb) | [Homework 3](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Homeworks/Logistic%20Regression_Homework_Public.ipynb)| 22 | | Topic 5 | Feature Engineering | [Slide](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Topic%205/Lecture%205%20-%20Feature%20Engineering.pdf) | [Link to Readings/Resources](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Reading%20Materials/Feature%20Representation.pdf); [Scikit-Learn](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Topic%205/Addtional%20Material%20-%20Scikit-Learn.pdf) | [Feature Engineering Lab](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Notebooks/Feature%20Engineering.ipynb) | [Homework 4](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Homeworks/Scikit-Learn%20-%20Logistic%20Regression%20Homework_Public.ipynb); [Homework 
5](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Homeworks/Scikit-Learn%20-%20Linear%20Regression%20Homework_Public.ipynb)| 23 | | Topic 6 | Neural Network | [Slide](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Topic%206/Lecture%206%20-Neural%20Network.pdf) | [Link to Readings/Resources](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Reading%20Materials/Neural_Networks.pdf)| [Neural Network Lab](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Notebooks/Neural%20Network%20from%20Scratch.ipynb) | TBA| 24 | | Topic 7 | Autoencoder | [Slide](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Topic%207/Lecture%207%20-%20Neural%20Network%20-%20AutoEncoder.pdf) | [Neural Net. Pt.2](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Reading%20Materials/Neural_Networks_Part%202.pdf)/[Link to Readings/Resources](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Reading%20Materials/Autoencoders.pdf) | [Autoencoder Lab](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Notebooks/Autoencoder.ipynb)| TBA| 25 | | Topic 8 | [Pytorch Tutorial](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Notebooks/PyTorch_Tutorial.ipynb) | 26 | | Topic 9 | Convolutional Neural Networks | [Slide](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Topic%208/Lecture%208%20-%20Convolutional%20Neural%20Network.pdf) | [Reading Material](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Reading%20Materials/Convolutional_Neural_Networks.pdf) |[CNN Lab](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Notebooks/CNN%20Lab.ipynb) | TBA| 27 | | Topic 10 | Non-parametric Models | 
[Slide](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Topic%209/Lecture%209%20-%20Non-Parametric%20Models.pdf) | [Reading Material](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Reading%20Materials/Non-parametric%20methods.pdf) | [Decision Tree Lab](https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning/blob/main/Notebooks/Decision%20Tree.ipynb) | TBA| 28 | --- 29 | 30 | ## How to Use This Repository 31 | 32 | 1. **Clone the repository**: 33 | ```bash 34 | git clone https://github.com/rinabuoy/Practical-Applications-in-Machine-Learning.git 35 | cd Practical-Applications-in-Machine-Learning 36 | ``` 37 | 38 | ## Additional Materials: 39 | 40 | **Textbooks** 41 | 42 | (1) [Speech and Language Processing (3rd ed. draft)](https://web.stanford.edu/~jurafsky/slp3/) 43 | 44 | (2) [Understanding Deep Learning](https://udlbook.github.io/udlbook/) 45 | 46 | (3) [Deep Learning: Foundations and Concepts](https://link.springer.com/book/10.1007/978-3-031-45468-4) 47 | 48 | (4) [Probabilistic Machine Learning: An Introduction](https://probml.github.io/pml-book/book1.html) 49 | 50 | (5) [Machine Learning with PyTorch and Scikit-Learn Book](https://github.com/rasbt/machine-learning-book) 51 | 52 | **Probability** 53 | 54 | (1) [CS229](https://cs229.stanford.edu/lectures-spring2022/cs229-probability_review.pdf) 55 | 56 | (2) [3Blue1Brown](https://www.youtube.com/watch?v=8idr1WZ1A7Q&list=PLZHQObOWTQDOjmo3Y6ADm0ScWAlEXf-fp) 57 | 58 | **Linear Algebra** 59 | 60 | (1) [CS229](https://cs229.stanford.edu/notes2024summer/cs229-linear_algebra.pdf) 61 | 62 | (2) [3Blue1Brown](https://www.youtube.com/watch?v=fNk_zzaMoSs&list=PLZHQObOWTQDPD3MizzM2xVFitgF8hE_ab) 63 | 64 | **Python** 65 | 66 | (1) [Python](https://colab.research.google.com/github/cs231n/cs231n.github.io/blob/master/python-colab.ipynb) 67 | 68 | (2) [Numpy](https://cs231n.github.io/python-numpy-tutorial/) 69 | 70 | (3) 
[Pytorch](https://colab.research.google.com/drive/1FERNv6t8xpX9Nly_JdnePWEPllI7F3Fx?usp=sharing) 71 | 72 | (4) [CS50](https://cs50.harvard.edu/python/2022/) 73 | 74 | (5) [How to Create and Publish Your Own Python Package](https://medium.com/@nydas/how-to-create-and-publish-your-own-python-package-8e4f3fd70506) 75 | 76 | **Neural Networks** 77 | 78 | (1) [3Blue1Brown](https://www.youtube.com/watch?v=aircAruvnKk&list=PLZHQObOWTQDNU6R1_67000Dx_ZCJB-3pi) 79 | 80 | (2) [Zero-to-Hero by Andrej Karpathy](https://www.youtube.com/playlist?list=PLAqhIrjkxbuWI23v9cThsA9GvCAUhRvKZ) 81 | 82 | (3) [Visualizing transformers and attention | Talk for TNG Big Tech Day '24](https://www.youtube.com/watch?v=KJtZARuO3JY&t=313s) 83 | 84 | **HuggingFace** 85 | 86 | (1) [CS224N: Hugging Face Transformers Tutorial (Spring '24) ](https://colab.research.google.com/drive/13r94i6Fh4oYf-eJRSi7S_y_cen5NYkBm#scrollTo=9EhWoZef-X8u) 87 | 88 | 89 | 90 | **Other tools** 91 | 92 | (1) [Missing Semester (Git, Command-line)](https://missing.csail.mit.edu/) 93 | 94 | (2) [Llama 3.2 Running Locally in VSCode: How to Set It Up with CodeGPT and Ollama](https://medium.com/@dan.avila7/llama-3-2-running-locally-in-vscode-how-to-set-it-up-with-codegpt-and-olla-8d33fd29c195) 95 | 96 | (3) [How to run Ollama in Windows via WSL](https://medium.com/@Tanzim/how-to-run-ollama-in-windows-via-wsl-8ace765cee12) 97 | 98 | 99 | **Inspirational/ General Knowledge Videos** 100 | 101 | (1) [Invention of Blue LED](https://www.youtube.com/watch?v=AF8d72mA41M) 102 | 103 | (2) [Invention of QR Code](https://www.youtube.com/watch?v=w5ebcowAJD8) 104 | 105 | **License** 106 | 107 | This course content is licensed under the MIT License. 
108 | 109 | 110 | 111 | 112 | -------------------------------------------------------------------------------- /Reading Materials/Autoencoders.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rinabuoy/Practical-Applications-in-Machine-Learning/828573933300184fc0d888b901a1a69de5658dbd/Reading Materials/Autoencoders.pdf -------------------------------------------------------------------------------- /Reading Materials/Convolutional_Neural_Networks.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rinabuoy/Practical-Applications-in-Machine-Learning/828573933300184fc0d888b901a1a69de5658dbd/Reading Materials/Convolutional_Neural_Networks.pdf -------------------------------------------------------------------------------- /Reading Materials/Feature Representation.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rinabuoy/Practical-Applications-in-Machine-Learning/828573933300184fc0d888b901a1a69de5658dbd/Reading Materials/Feature Representation.pdf -------------------------------------------------------------------------------- /Reading Materials/Gradient_Descent.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rinabuoy/Practical-Applications-in-Machine-Learning/828573933300184fc0d888b901a1a69de5658dbd/Reading Materials/Gradient_Descent.pdf -------------------------------------------------------------------------------- /Reading Materials/Introduction.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rinabuoy/Practical-Applications-in-Machine-Learning/828573933300184fc0d888b901a1a69de5658dbd/Reading Materials/Introduction.pdf -------------------------------------------------------------------------------- /Reading 
Materials/Linear Classification.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rinabuoy/Practical-Applications-in-Machine-Learning/828573933300184fc0d888b901a1a69de5658dbd/Reading Materials/Linear Classification.pdf -------------------------------------------------------------------------------- /Reading Materials/Linear Regression.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rinabuoy/Practical-Applications-in-Machine-Learning/828573933300184fc0d888b901a1a69de5658dbd/Reading Materials/Linear Regression.pdf -------------------------------------------------------------------------------- /Reading Materials/Neural_Networks.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rinabuoy/Practical-Applications-in-Machine-Learning/828573933300184fc0d888b901a1a69de5658dbd/Reading Materials/Neural_Networks.pdf -------------------------------------------------------------------------------- /Reading Materials/Neural_Networks_Part 2.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rinabuoy/Practical-Applications-in-Machine-Learning/828573933300184fc0d888b901a1a69de5658dbd/Reading Materials/Neural_Networks_Part 2.pdf -------------------------------------------------------------------------------- /Reading Materials/Non-parametric methods.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rinabuoy/Practical-Applications-in-Machine-Learning/828573933300184fc0d888b901a1a69de5658dbd/Reading Materials/Non-parametric methods.pdf -------------------------------------------------------------------------------- /Topic 1/Intro_General.pdf: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/rinabuoy/Practical-Applications-in-Machine-Learning/828573933300184fc0d888b901a1a69de5658dbd/Topic 1/Intro_General.pdf -------------------------------------------------------------------------------- /Topic 2/Lecture 2 - Linear Regression, Regularization and Cross-Validation.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rinabuoy/Practical-Applications-in-Machine-Learning/828573933300184fc0d888b901a1a69de5658dbd/Topic 2/Lecture 2 - Linear Regression, Regularization and Cross-Validation.pdf -------------------------------------------------------------------------------- /Topic 3/Lecture 3 - Gradient Descent.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rinabuoy/Practical-Applications-in-Machine-Learning/828573933300184fc0d888b901a1a69de5658dbd/Topic 3/Lecture 3 - Gradient Descent.pdf -------------------------------------------------------------------------------- /Topic 4/Lecture 4 - Linear Classification.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rinabuoy/Practical-Applications-in-Machine-Learning/828573933300184fc0d888b901a1a69de5658dbd/Topic 4/Lecture 4 - Linear Classification.pdf -------------------------------------------------------------------------------- /Topic 5/Addtional Material - Scikit-Learn.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rinabuoy/Practical-Applications-in-Machine-Learning/828573933300184fc0d888b901a1a69de5658dbd/Topic 5/Addtional Material - Scikit-Learn.pdf -------------------------------------------------------------------------------- /Topic 5/Lecture 5 - Feature Engineering.pdf: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/rinabuoy/Practical-Applications-in-Machine-Learning/828573933300184fc0d888b901a1a69de5658dbd/Topic 5/Lecture 5 - Feature Engineering.pdf -------------------------------------------------------------------------------- /Topic 6/Lecture 6 -Neural Network.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rinabuoy/Practical-Applications-in-Machine-Learning/828573933300184fc0d888b901a1a69de5658dbd/Topic 6/Lecture 6 -Neural Network.pdf -------------------------------------------------------------------------------- /Topic 7/Lecture 7 - Neural Network - AutoEncoder.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rinabuoy/Practical-Applications-in-Machine-Learning/828573933300184fc0d888b901a1a69de5658dbd/Topic 7/Lecture 7 - Neural Network - AutoEncoder.pdf -------------------------------------------------------------------------------- /Topic 8/Lecture 8 - Convolutional Neural Network.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rinabuoy/Practical-Applications-in-Machine-Learning/828573933300184fc0d888b901a1a69de5658dbd/Topic 8/Lecture 8 - Convolutional Neural Network.pdf -------------------------------------------------------------------------------- /Topic 9/Lecture 9 - Non-Parametric Models.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rinabuoy/Practical-Applications-in-Machine-Learning/828573933300184fc0d888b901a1a69de5658dbd/Topic 9/Lecture 9 - Non-Parametric Models.pdf -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- 1 | torch >= 2.0.1 # all 2 | jupyterlab >= 4.0 # all 3 | matplotlib >= 3.7.1 # ch04; ch05 4 | tqdm >= 
4.66.1 # ch05; ch07 5 | numpy >= 1.25, < 2.0 # dependency of several other libraries like torch and pandas 6 | pandas >= 2.2.1 # ch06 7 | psutil >= 5.9.5 # ch07; already installed automatically as dependency of torch 8 | --------------------------------------------------------------------------------