├── 08. Object Detection ├── requirements.txt ├── Images │ ├── F9.jpg │ └── F9.mp4 ├── Dataset │ └── coco_classes.pickle └── README.md ├── 07. Pretrained CNNs ├── requirements.txt ├── Images │ └── Bal1.JPG └── README.md ├── 03. Image Classification ├── requirements.txt ├── Scripts │ └── simplepreprocessor.py ├── README.md └── Simplepreprocessor.ipynb ├── 01. OpenCV ├── requirements.txt ├── Images │ ├── MM.jpg │ ├── P.jpg │ ├── Bal1.JPG │ ├── Cat.jpg │ ├── Empire_cloudy1.jpg │ └── Empire_sunset1.jpg └── README.md ├── 04. Neural Networks ├── requirements.txt └── README.md ├── 02. ConvolutionalNeuralNetworks ├── requirements.txt ├── Images │ ├── Bal1.JPG │ └── Empire_cloudy1.jpg ├── README.md └── Convolutional Layers.ipynb ├── 05. LeNet Architecture ├── requirements.txt ├── README.md └── LeNet.ipynb ├── 06. VGGNet Architecture ├── requirements.txt ├── README.md └── Mini VGGNet.ipynb ├── LICENSE └── README.md /08. Object Detection/requirements.txt: -------------------------------------------------------------------------------- 1 | cv2 2 | numpy 3 | torch 4 | pickle -------------------------------------------------------------------------------- /07. Pretrained CNNs/requirements.txt: -------------------------------------------------------------------------------- 1 | cv2 2 | numpy 3 | tensorflow 4 | keras -------------------------------------------------------------------------------- /03. Image Classification/requirements.txt: -------------------------------------------------------------------------------- 1 | cv2 2 | imutils 3 | numpy 4 | matplotlib 5 | os -------------------------------------------------------------------------------- /01. OpenCV/requirements.txt: -------------------------------------------------------------------------------- 1 | cv2 2 | imutils 3 | numpy 4 | argparse 5 | matplotlib 6 | skimage -------------------------------------------------------------------------------- /04. 
Neural Networks/requirements.txt: -------------------------------------------------------------------------------- 1 | numpy 2 | sklearn 3 | tensorflow 4 | keras 5 | matplotlib 6 | -------------------------------------------------------------------------------- /02. ConvolutionalNeuralNetworks/requirements.txt: -------------------------------------------------------------------------------- 1 | cv2 2 | imutils 3 | numpy 4 | matplotlib 5 | skimage -------------------------------------------------------------------------------- /01. OpenCV/Images/MM.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ThinamXx/ComputerVision/HEAD/01. OpenCV/Images/MM.jpg -------------------------------------------------------------------------------- /01. OpenCV/Images/P.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ThinamXx/ComputerVision/HEAD/01. OpenCV/Images/P.jpg -------------------------------------------------------------------------------- /01. OpenCV/Images/Bal1.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ThinamXx/ComputerVision/HEAD/01. OpenCV/Images/Bal1.JPG -------------------------------------------------------------------------------- /01. OpenCV/Images/Cat.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ThinamXx/ComputerVision/HEAD/01. OpenCV/Images/Cat.jpg -------------------------------------------------------------------------------- /05. LeNet Architecture/requirements.txt: -------------------------------------------------------------------------------- 1 | cv2 2 | imutils 3 | numpy 4 | matplotlib 5 | skimage 6 | keras 7 | tensorflow -------------------------------------------------------------------------------- /08. 
Object Detection/Images/F9.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ThinamXx/ComputerVision/HEAD/08. Object Detection/Images/F9.jpg -------------------------------------------------------------------------------- /08. Object Detection/Images/F9.mp4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ThinamXx/ComputerVision/HEAD/08. Object Detection/Images/F9.mp4 -------------------------------------------------------------------------------- /01. OpenCV/Images/Empire_cloudy1.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ThinamXx/ComputerVision/HEAD/01. OpenCV/Images/Empire_cloudy1.jpg -------------------------------------------------------------------------------- /01. OpenCV/Images/Empire_sunset1.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ThinamXx/ComputerVision/HEAD/01. OpenCV/Images/Empire_sunset1.jpg -------------------------------------------------------------------------------- /07. Pretrained CNNs/Images/Bal1.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ThinamXx/ComputerVision/HEAD/07. Pretrained CNNs/Images/Bal1.JPG -------------------------------------------------------------------------------- /06. VGGNet Architecture/requirements.txt: -------------------------------------------------------------------------------- 1 | cv2 2 | imutils 3 | numpy 4 | matplotlib 5 | skimage 6 | keras 7 | tensorflow 8 | scikit-learn -------------------------------------------------------------------------------- /02. ConvolutionalNeuralNetworks/Images/Bal1.JPG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ThinamXx/ComputerVision/HEAD/02. 
ConvolutionalNeuralNetworks/Images/Bal1.JPG -------------------------------------------------------------------------------- /08. Object Detection/Dataset/coco_classes.pickle: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ThinamXx/ComputerVision/HEAD/08. Object Detection/Dataset/coco_classes.pickle -------------------------------------------------------------------------------- /02. ConvolutionalNeuralNetworks/Images/Empire_cloudy1.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ThinamXx/ComputerVision/HEAD/02. ConvolutionalNeuralNetworks/Images/Empire_cloudy1.jpg -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- 1 | MIT License 2 | 3 | Copyright (c) 2021 Thinam Tamang 4 | 5 | Permission is hereby granted, free of charge, to any person obtaining a copy 6 | of this software and associated documentation files (the "Software"), to deal 7 | in the Software without restriction, including without limitation the rights 8 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 9 | copies of the Software, and to permit persons to whom the Software is 10 | furnished to do so, subject to the following conditions: 11 | 12 | The above copyright notice and this permission notice shall be included in all 13 | copies or substantial portions of the Software. 14 | 15 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 16 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 17 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. 
IN NO EVENT SHALL THE 18 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 19 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 20 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 21 | SOFTWARE. 22 | -------------------------------------------------------------------------------- /05. LeNet Architecture/README.md: -------------------------------------------------------------------------------- 1 | # **Computer Vision: LeNet Architecture** 2 | 3 | The [**LeNet Architecture**](https://github.com/ThinamXx/ComputerVision/blob/main/05.%20LeNet%20Architecture/LeNet.ipynb) notebook contains the implementation of LeNet Architecture. LeNet is a seminal work in the deep learning literature which demonstrates how neural networks could be trained to recognize objects in images without feature extraction. 4 | 5 | 📚**Notebooks:** 6 | - [**LeNet Notebook**](https://github.com/ThinamXx/ComputerVision/blob/main/05.%20LeNet%20Architecture/LeNet.ipynb) 7 | 8 | **LeNet** 9 | - I will define the build method of LeNet architecture below. It requires four parameters: width of input image, height of input image, depth of image, number of class labels in the classification task. The Sequential class, the building block of sequential networks, sequentially stacks one layer on top of the other layer initialized below. I have presented the implementation of LeNet Architecture, Training and Model Evaluation here in the snapshot. 10 | 11 | ![Image](https://github.com/ThinamXx/MachineLearning_DeepLearning/blob/main/Images/Day%2016a.PNG) 12 | ![Image](https://github.com/ThinamXx/MachineLearning_DeepLearning/blob/main/Images/Day%2016b.PNG) 13 | -------------------------------------------------------------------------------- /07.
Pretrained CNNs/README.md: -------------------------------------------------------------------------------- 1 | # **Computer Vision: Pretrained Convolutional Neural Networks** 2 | 3 | - The [**Pretrained CNNs**](https://github.com/ThinamXx/ComputerVision/blob/main/07.%20Pretrained%20CNNs/PretrainedCNNs.ipynb) notebook contains the reviews of convolutional neural networks and implementation of VGG16 and Xception networks for classification of images. 4 | 5 | 📚**Notebook:** 6 | - [**Pretrained CNNs**](https://github.com/ThinamXx/ComputerVision/blob/main/07.%20Pretrained%20CNNs/PretrainedCNNs.ipynb) 7 | 8 | **Convolutional Neural Networks:** 9 | - Convolutions are just a type of matrix multiplication with two constraints on the weight matrix: some elements are always zero and some elements are tied or forced to always have the same value. Batch Normalization adds some extra randomness to the training process. Larger batches have gradients that are more accurate since they are calculated from more data. But a larger batch size means fewer batches per epoch, which means fewer opportunities for the model to update weights. VGG16, VGG19, and ResNet all accept 224 x 224 input images while InceptionV3 and Xception require 299 x 299 pixel inputs. 10 | 11 | ![Image](https://github.com/ThinamXx/MachineLearning_DeepLearning/blob/main/Images/Day%2019.PNG) 12 | 13 | -------------------------------------------------------------------------------- /04. Neural Networks/README.md: -------------------------------------------------------------------------------- 1 | # **Computer Vision: Neural Networks** 2 | 3 | The [**Neural Networks**](https://github.com/ThinamXx/ComputerVision/blob/main/04.%20Neural%20Networks/NeuralNetworks.ipynb) notebook contains the implementation of **Perceptron** algorithm, backpropagation algorithm, and neural networks from scratch.
4 | 5 | 📚**Notebooks:** 6 | - [**Neural Network**](https://github.com/ThinamXx/ComputerVision/blob/main/04.%20Neural%20Networks/NeuralNetworks.ipynb) 7 | 8 | **Rectified Linear Unit** 9 | - ReLU is zero for negative inputs but increases linearly for positive inputs. The ReLU function is not saturable and is also extremely computationally efficient. ReLU is the most popular activation function used in deep learning and has stronger biological motivations. 10 | 11 | **Perceptron Algorithm** 12 | - I have presented the implementation of Perceptron Algorithm here in the snapshot. 13 | 14 | ![Image](https://github.com/ThinamXx/MachineLearning_DeepLearning/blob/main/Images/Day%2011.PNG) 15 | 16 | **Backpropagation Algorithm** 17 | - I have presented the implementation of Neural Network and Backpropagation here in the snapshot. 18 | 19 | ![Image](https://github.com/ThinamXx/MachineLearning_DeepLearning/blob/main/Images/Day%2012a.PNG) 20 | ![Image](https://github.com/ThinamXx/MachineLearning_DeepLearning/blob/main/Images/Day%2012b.PNG) 21 | -------------------------------------------------------------------------------- /02. ConvolutionalNeuralNetworks/README.md: -------------------------------------------------------------------------------- 1 | # **Computer Vision: Convolutional Neural Networks** 2 | 3 | The [**Convolutions**](https://github.com/ThinamXx/ComputerVision/blob/main/02.%20ConvolutionalNeuralNetworks/Convolutions.ipynb) notebook contains all the dependencies required to understand the implementation of Image Convolutions and Kernels. 4 | 5 | The [**Convolutional Layers**](https://github.com/ThinamXx/ComputerVision/blob/main/02.%20ConvolutionalNeuralNetworks/Convolutional%20Layers.ipynb) notebook contains all the dependencies required to understand Keras Conv2D Class and Convolutional Layers. 
6 | 7 | **Notebooks:** 8 | - [**Convolutions**](https://github.com/ThinamXx/ComputerVision/blob/main/02.%20ConvolutionalNeuralNetworks/Convolutions.ipynb) 9 | - [**Convolutional Layers**](https://github.com/ThinamXx/ComputerVision/blob/main/02.%20ConvolutionalNeuralNetworks/Convolutional%20Layers.ipynb) 10 | 11 | **Strided Net** 12 | - I have presented the implementation of Strided Net here in the snapshot. 13 | 14 | ![Image](https://github.com/ThinamXx/300Days__MachineLearningDeepLearning/blob/main/Images/Day%20296.PNG) 15 | 16 | **Preparing Dataset** 17 | - I have presented the implementation of Label Binarizer and Preparing Dataset here in the snapshot. 18 | 19 | ![Image](https://github.com/ThinamXx/300Days__MachineLearningDeepLearning/blob/main/Images/Day%20297.PNG) 20 | 21 | **Training Model** 22 | - I have presented the implementation of Compiling and Training Model, Classification Report, Training Loss and Accuracy here in the snapshot. 23 | 24 | ![Image](https://github.com/ThinamXx/300Days__MachineLearningDeepLearning/blob/main/Images/Day%20298.PNG) 25 | -------------------------------------------------------------------------------- /08. Object Detection/README.md: -------------------------------------------------------------------------------- 1 | # **Computer Vision: Object Detection** 2 | 3 | The [**Object Detection**](https://github.com/ThinamXx/ComputerVision/blob/main/08.%20Object%20Detection/ObjectDetection.ipynb) notebook contains implementation of object detection with PyTorch and pretrained networks. It also contains brief description about object detection and image preprocessing. 4 | 5 | 📚**Notebook** 6 | - [**Object Detection**](https://github.com/ThinamXx/ComputerVision/blob/main/08.%20Object%20Detection/ObjectDetection.ipynb) 7 | 8 | **COCO Dataset** 9 | - The [COCO Dataset](https://cocodataset.org/#home): Common Objects in Context, tends to be the standard for object detection benchmarking. 
The dataset contains over 90 classes of common objects we see in the everyday world. 10 | 11 | **Object Detection** 12 | - Object Detection is a computer technology related to computer vision and image processing that deals with detecting instances of semantic objects of a certain class. I will use PyTorch to perform object detection using the following state-of-the-art object detection networks: 13 | - Faster R-CNN with a ResNet50. 14 | - Faster R-CNN with a MobileNet V3. 15 | - RetinaNet with a ResNet50. 16 | 17 | **Image Preprocessing** 18 | - Converting color channel ordering from BGR to RGB. 19 | - Swapping color channel ordering from channels last to channels first. 20 | - Adding a batch dimension. 21 | - Scaling pixel intensities from the range [0, 255] to [0, 1]. 22 | - Converting the image from a numpy array to a floating point tensor. 23 | 24 | ![Image](https://github.com/ThinamXx/MachineLearning_DeepLearning/blob/main/Images/Day%2020a.PNG) 25 | 26 | ![Image](https://github.com/ThinamXx/MachineLearning_DeepLearning/blob/main/Images/Day%2020b.PNG) 27 | -------------------------------------------------------------------------------- /06. VGGNet Architecture/README.md: -------------------------------------------------------------------------------- 1 | # **Computer Vision: Mini VGGNet Architecture** 2 | 3 | The [**Mini VGGNet**](https://github.com/ThinamXx/ComputerVision/blob/main/06.%20VGGNet%20Architecture/Mini%20VGGNet.ipynb) notebook contains the implementation of VGGNet Architecture. It makes use of only *3 X 3* filters regardless of network depth. 4 | 5 | 📚**Notebook** 6 | - [**Mini VGGNet Architecture**](https://github.com/ThinamXx/ComputerVision/blob/main/06.%20VGGNet%20Architecture/Mini%20VGGNet.ipynb) 7 | 8 | **Logistic Regression** 9 | - However, when an unnecessary or excessive number of variables is used in a logistic regression model, peculiarities i.e.
special attributes of the underlying dataset disproportionately affect the coefficients of the model, a phenomenon commonly known as overfitting. So, it is most important that the logistic regression model doesn't start training more variables than is justified for the given number of observations. 10 | 11 | **Batch Normalization** 12 | - Batch Normalization can lead to a faster, more stable convergence with higher accuracy. Batch Normalization will require more wall time to train the network even though the network will obtain higher accuracy in fewer epochs. 13 | 14 | **VGGNet Architecture** 15 | - I will define the build method of Mini VGGNet architecture below. It requires four parameters: width of input image, height of input image, depth of image, number of class labels in the classification task. The Sequential class, the building block of sequential networks, sequentially stacks one layer on top of the other layer initialized below. Batch Normalization operates over the channels, so in order to apply BN, we need to know which axis to normalize over. 16 | 17 | ![Image](https://github.com/ThinamXx/MachineLearning_DeepLearning/blob/main/Images/Day%2017.PNG) 18 | -------------------------------------------------------------------------------- /01. OpenCV/README.md: -------------------------------------------------------------------------------- 1 | # **Computer Vision: OpenCV** 2 | 3 | The [**OpenCV**](https://github.com/ThinamXx/ComputerVision/blob/main/01.%20OpenCV/OpenCV.ipynb) notebook contains the basics of **OpenCV** such as Loading an Image, Resizing Images, Rotating Image, Edge Detection, Thresholding, Drawing and Masking, Contour and Shape Detection. 4 | 5 | The [**OCV Project I**](https://github.com/ThinamXx/ComputerVision/blob/main/01.%20OpenCV/OCV%20Project%20I.ipynb) notebook contains the implementation of Rotating Images correctly without cut off.
6 | 7 | The [**OCV Project II**](https://github.com/ThinamXx/ComputerVision/blob/main/01.%20OpenCV/OCV%20Project%20II.ipynb) notebook contains the implementation of Color Detection and Histogram Matching on images. 8 | 9 | **Note:** 10 | - 📑[**OpenCV**](https://github.com/ThinamXx/ComputerVision/blob/main/01.%20OpenCV/OpenCV.ipynb) 11 | - 📑[**OCV Project I**](https://github.com/ThinamXx/ComputerVision/blob/main/01.%20OpenCV/OCV%20Project%20I.ipynb) 12 | - 📑[**OCV Project II**](https://github.com/ThinamXx/ComputerVision/blob/main/01.%20OpenCV/OCV%20Project%20II.ipynb) 13 | 14 | **Image Processing** 15 | - I have presented the implementation of OpenCV in Resizing and Rotating an Image, Smoothing and Drawing on an Image, Converting Image to Grayscale, Edge Detection, Thresholding, Detecting and Drawing Contours, Erosions and Dilations here in the snapshot. 16 | 17 | ![Image](https://github.com/ThinamXx/300Days__MachineLearningDeepLearning/blob/main/Images/Day%20291.PNG) 18 | ![Image](https://github.com/ThinamXx/300Days__MachineLearningDeepLearning/blob/main/Images/Day%20292.PNG) 19 | 20 | **Rotating Image** 21 | - I have presented the implementation of OpenCV in Rotating Images and Getting ROI of Images here in the snapshot. 22 | 23 | ![Image](https://github.com/ThinamXx/300Days__MachineLearningDeepLearning/blob/main/Images/Day%20293.PNG) 24 | 25 | **Histogram Matching** 26 | - Histogram Matching can be used as a normalization technique in an image processing pipeline as a form of color correction and color matching, which makes it possible to obtain a consistent, normalized representation of images even if lighting conditions change. I have presented the implementation of OpenCV in Histogram Matching here in the snapshot. 27 | 28 | ![Image](https://github.com/ThinamXx/300Days__MachineLearningDeepLearning/blob/main/Images/Day%20294.PNG) 29 | -------------------------------------------------------------------------------- /03.
#@ IMPORTING LIBRARIES AND PACKAGES:
import cv2
import numpy as np
import os


#@ INITIALIZING SIMPLE PREPROCESSOR:
class SimplePreprocessor:
    """Resize images to a fixed width and height, ignoring the aspect ratio.

    Args:
        width: Target width passed to ``cv2.resize``.
        height: Target height passed to ``cv2.resize``.
        inter: OpenCV interpolation flag used when resizing
            (defaults to ``cv2.INTER_AREA``).
    """

    def __init__(self, width, height, inter=cv2.INTER_AREA):
        self.width = width                                      # Target width.
        self.height = height                                    # Target height.
        self.inter = inter                                      # Interpolation flag.

    def preprocess(self, image):
        """Return ``image`` resized to ``(self.width, self.height)``."""
        return cv2.resize(image, (self.width, self.height),
                          interpolation=self.inter)             # Resizing Image.


#@ INITIALIZING DATASET LOADER:
class SimpleDatasetLoader:
    """Load images from disk and run them through a chain of preprocessors.

    Args:
        preprocessors: Optional list of objects exposing ``preprocess(image)``.
            They are applied to every image in list order. ``None`` means
            no preprocessing.
    """

    def __init__(self, preprocessors=None):
        # Normalise None to an empty list so load() can always iterate.
        self.preprocessors = preprocessors if preprocessors is not None else []

    def load(self, imagePaths, verbose=-1):
        """Read, label and preprocess every image in ``imagePaths``.

        The label of an image is the name of the directory that directly
        contains it (``.../<label>/<file>``). A path without a parent
        directory yields an empty label.

        Args:
            imagePaths: Iterable of image file paths (a generator is accepted).
            verbose: When greater than zero, a progress message is printed
                after every ``verbose`` images.

        Returns:
            Tuple ``(data, labels)`` of NumPy arrays built from the loaded
            images and their labels. Images that cannot be read are skipped,
            so both arrays stay aligned.
        """
        imagePaths = list(imagePaths)                           # Allow generators; len() is needed below.
        total = len(imagePaths)
        data, labels = [], []                                   # Initializing Empty Lists.
        for (i, imagePath) in enumerate(imagePaths):
            image = cv2.imread(imagePath)                       # Reading Image.
            if image is None:
                # cv2.imread signals failure by returning None instead of raising;
                # skip the file rather than crash inside a preprocessor.
                print("[WARN] skipping unreadable image: {}".format(imagePath))
                continue
            # Parent directory name; os.path copes with mixed or repeated separators.
            label = os.path.basename(os.path.dirname(imagePath))
            for p in self.preprocessors:
                image = p.preprocess(image)                     # Preprocessing Image.
            data.append(image)                                  # Updating Data.
            labels.append(label)                                # Updating Label.
            if verbose > 0 and (i + 1) % verbose == 0:
                print("[INFO] processed {}/{}".format(
                    i + 1, total))                              # Showing Updates.
        return (np.array(data), np.array(labels))               # Initializing Array of Data.
39 | 40 | -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- 1 | # **COMPUTER VISION** 2 | 3 | The repository contains a list of projects and notebooks which I have worked on while reading Computer Vision, Deep Learning and OpenCV from [**PyImageSearch**](https://www.pyimagesearch.com/). 4 | 5 | ### 📚**NOTEBOOKS:** 6 | 7 | [**1. OPEN CV**](https://github.com/ThinamXx/ComputerVision/tree/main/01.%20OpenCV) 8 | - The **OpenCV** notebook contains the basics of OpenCV such as Loading an Image, Resizing Images, Rotating Image, Edge Detection, Thresholding, Drawing and Masking, Contour and Shape Detection. The **OCV Project I** notebook contains the implementation of Rotating Images correctly without cut off. The OCV Project II notebook contains the implementation of Color Detection and Histogram Matching on images. 9 | 10 | [**2. CONVOLUTIONAL NEURAL NETWORKS**](https://github.com/ThinamXx/ComputerVision/tree/main/02.%20ConvolutionalNeuralNetworks) 11 | - The **Convolutions** notebook contains all the dependencies required to understand the implementation of Image Convolutions and Kernels. The **Convolutional Layers** notebook contains all the dependencies required to understand Keras Conv2D Class and Convolutional Layers. 12 | 13 | [**3. IMAGE CLASSIFICATION**](https://github.com/ThinamXx/ComputerVision/tree/main/03.%20Image%20Classification) 14 | - The **Simplepreprocessor** notebook contains implementation of simple image preprocessor, loading an image dataset into memory, and K-Nearest Neighbor Classifier. K-Nearest Neighbor Classifier doesn’t actually learn anything, but it directly relies on the distance between feature vectors. The **GradientDescent** notebook contains implementation of Gradient Descent Algorithms. 
The **StochasticGradientDescent** notebook contains implementation of Stochastic Gradient Descent, Image Classification and Regularization. 15 | 16 | [**4. NEURAL NETWORKS**](https://github.com/ThinamXx/ComputerVision/tree/main/04.%20Neural%20Networks) 17 | - The **Neural Networks** notebook contains the implementation of Perceptron algorithm, backpropagation algorithm, and neural networks from scratch. 18 | 19 | [**5. LENET ARCHITECTURE**](https://github.com/ThinamXx/ComputerVision/tree/main/05.%20LeNet%20Architecture) 20 | - The **LeNet Architecture** notebook contains the implementation of LeNet Architecture. LeNet is a seminal work in the deep learning literature which demonstrates how neural networks could be trained to recognize objects in images without feature extraction. 21 | 22 | [**6. VGGNET ARCHITECTURE**](https://github.com/ThinamXx/ComputerVision/tree/main/06.%20VGGNet%20Architecture) 23 | - The **Mini VGGNet** notebook contains the implementation of VGGNet Architecture. It makes use of only 3 X 3 filters regardless of network depth. 24 | 25 | [**7. PRETRAINED CNN**](https://github.com/ThinamXx/ComputerVision/tree/main/07.%20Pretrained%20CNNs) 26 | - The **Pretrained CNNs** notebook contains the reviews of convolutional neural networks and implementation of VGG16 and Xception networks for classification of images. 27 | 28 | [**8. OBJECT DETECTION**](https://github.com/ThinamXx/ComputerVision/tree/main/08.%20Object%20Detection) 29 | - The **Object Detection** notebook contains implementation of object detection with PyTorch and pretrained networks. It also contains brief description about object detection and image preprocessing. 30 | -------------------------------------------------------------------------------- /03.
Image Classification/README.md: -------------------------------------------------------------------------------- 1 | # **Computer Vision: Image Classification** 2 | 3 | The [**Simplepreprocessor**](https://github.com/ThinamXx/ComputerVision/blob/main/03.%20Image%20Classification/Simplepreprocessor.ipynb) notebook contains implementation of simple image preprocessor, loading an image dataset into memory, and K-Nearest Neighbor Classifier. K-Nearest Neighbor Classifier doesn’t actually learn anything, but it directly relies on the distance between feature vectors. 4 | 5 | The [**GradientDescent**](https://github.com/ThinamXx/ComputerVision/blob/main/03.%20Image%20Classification/GradientDescent.ipynb) notebook contains implementation of Gradient Descent Algorithms. 6 | 7 | The [**StochasticGradientDescent**](https://github.com/ThinamXx/ComputerVision/blob/main/03.%20Image%20Classification/StochasticGradientDescent.ipynb) notebook contains implementation of Stochastic Gradient Descent, Image Classification and Regularization. 8 | 9 | **Notebook:** 10 | - 📑[**Simplepreprocessor**](https://github.com/ThinamXx/ComputerVision/blob/main/03.%20Image%20Classification/Simplepreprocessor.ipynb) 11 | - 📑[**LinearClassifier**](https://github.com/ThinamXx/ComputerVision/blob/main/03.%20Image%20Classification/LinearClassifier.ipynb) 12 | - 📑[**GradientDescent**](https://github.com/ThinamXx/ComputerVision/blob/main/03.%20Image%20Classification/GradientDescent.ipynb) 13 | - 📑[**StochasticGradientDescent**](https://github.com/ThinamXx/ComputerVision/blob/main/03.%20Image%20Classification/StochasticGradientDescent.ipynb) 14 | 15 | **Linear Classifier** 16 | - I have presented the notes about K-Nearest Neighbor and Parameterized Learning here in the snapshot. 
17 | 18 | ![Image](https://github.com/ThinamXx/MachineLearning_DeepLearning/blob/main/Images/Day%204.PNG) 19 | 20 | **Gradient Descent** 21 | - The gradient descent method is an iterative optimization algorithm that operates over a loss landscape, also called an optimization surface. Also, gradient descent refers to the process of attempting to optimize the parameters for low loss and high classification accuracy via an iterative process of taking a step in the direction that minimizes loss. I have presented the notes about Gradient Descent and Optimization here in the snapshot. 22 | 23 | ![Image](https://github.com/ThinamXx/MachineLearning_DeepLearning/blob/main/Images/Day%205.PNG) 24 | 25 | **Stochastic Gradient Descent** 26 | - Stochastic Gradient Descent is a simple modification to the standard gradient descent algorithm that computes the gradient and updates the weight matrix on small batches of training data, rather than the entire training set. I have presented the implementation of Sigmoid Activation Function and Stochastic Gradient Descent and notes about Regularization here in the snapshots. 27 | 28 | ![Image](https://github.com/ThinamXx/MachineLearning_DeepLearning/blob/main/Images/Day%207a.PNG) 29 | ![Image](https://github.com/ThinamXx/MachineLearning_DeepLearning/blob/main/Images/Day%207b.PNG) 30 | 31 | **Simple Preprocessor and Dataset Loader** 32 | - I will build an image preprocessor that resizes the image, ignoring the aspect ratio. I have presented the implementation of Image Preprocessor and Dataset Loader here in the snapshot. 33 | 34 | ![Image](https://github.com/ThinamXx/MachineLearning_DeepLearning/blob/main/Images/Day%202.PNG) 35 | 36 | **K-Nearest Neighbor** 37 | - K-Nearest Neighbor Classifier doesn’t actually learn anything, but it directly relies on the distance between feature vectors. I have presented the implementation of K-Nearest Neighbor Classifier and Model Evaluation here in the snapshot.
38 | 39 | ![Image](https://github.com/ThinamXx/MachineLearning_DeepLearning/blob/main/Images/Day%203.PNG) 40 | -------------------------------------------------------------------------------- /03. Image Classification/Simplepreprocessor.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "nbformat": 4, 3 | "nbformat_minor": 0, 4 | "metadata": { 5 | "colab": { 6 | "name": "Simplepreprocessor.ipynb", 7 | "provenance": [], 8 | "collapsed_sections": [] 9 | }, 10 | "kernelspec": { 11 | "name": "python3", 12 | "display_name": "Python 3" 13 | }, 14 | "language_info": { 15 | "name": "python" 16 | } 17 | }, 18 | "cells": [ 19 | { 20 | "cell_type": "markdown", 21 | "metadata": { 22 | "id": "xb0Eq2h3pkY0" 23 | }, 24 | "source": [ 25 | "**LIBRARIES AND DEPENDENCIES:**\n", 26 | "- I have downloaded all the libraries and dependencies required for the project in one particular cell." 27 | ] 28 | }, 29 | { 30 | "cell_type": "code", 31 | "metadata": { 32 | "id": "KpbKYZvxiPTd" 33 | }, 34 | "source": [ 35 | "#@ GETTING LIBRARIES AND DEPENDENCIES: UNCOMMENT BELOW: \n", 36 | "# !python /content/simplepreprocessor.py" 37 | ], 38 | "execution_count": 1, 39 | "outputs": [] 40 | }, 41 | { 42 | "cell_type": "code", 43 | "metadata": { 44 | "id": "eBJAB3K7jiZZ" 45 | }, 46 | "source": [ 47 | "#@ IMPORTING LIBRARIES AND PACKAGES: \n", 48 | "import cv2\n", 49 | "import numpy as np\n", 50 | "import os\n", 51 | "\n", 52 | "from sklearn.neighbors import KNeighborsClassifier\n", 53 | "from sklearn.preprocessing import LabelEncoder\n", 54 | "from sklearn.model_selection import train_test_split\n", 55 | "from sklearn.metrics import classification_report\n", 56 | "from simplepreprocessor import SimplePreprocessor\n", 57 | "from simplepreprocessor import SimpleDatasetLoader \n", 58 | "from imutils import paths" 59 | ], 60 | "execution_count": 2, 61 | "outputs": [] 62 | }, 63 | { 64 | "cell_type": "markdown", 65 | "metadata": { 66 | "id": "GwfQHwzSp3U8" 67 | 
}, 68 | "source": [ 69 | "**IMAGE PREPROCESSOR:**\n", 70 | "- I will build an image preprocessor that resizes the image, ignoring the aspect ratio. " 71 | ] 72 | }, 73 | { 74 | "cell_type": "code", 75 | "metadata": { 76 | "id": "pL3kk7skj0k4" 77 | }, 78 | "source": [ 79 | "#@ INITIALIZING SIMPLE PREPROCESSOR:\n", 80 | "class SimplePreprocessor: # Defining Simple Preprocessor. \n", 81 | " def __init__(self, width, height, inter=cv2.INTER_AREA): # Initializing Constructor Function. \n", 82 | " self.width = width # Initialization. \n", 83 | " self.height = height # Initialization. \n", 84 | " self.inter = inter # Initialization. \n", 85 | "\n", 86 | " def preprocess(self, image): # Defining Preprocess Function. \n", 87 | " return cv2.resize(image, (self.width, self.height), \n", 88 | " interpolation=self.inter) # Resizing Image. " 89 | ], 90 | "execution_count": 3, 91 | "outputs": [] 92 | }, 93 | { 94 | "cell_type": "markdown", 95 | "metadata": { 96 | "id": "Awkasacxq1OB" 97 | }, 98 | "source": [ 99 | "**IMAGE LOADER:**" 100 | ] 101 | }, 102 | { 103 | "cell_type": "code", 104 | "metadata": { 105 | "id": "tJGbNAsGleV0" 106 | }, 107 | "source": [ 108 | "#@ INITIALIZING DATASET LOADER: \n", 109 | "class SimpleDatasetLoader: # Defining Simple Image Loader. \n", 110 | " def __init__(self, preprocessors=None): # Initializing Constructor Function. \n", 111 | " self.preprocessors = preprocessors # Initialization. \n", 112 | " if self.preprocessors is None: # Inspection. \n", 113 | " self.preprocessors = [] # Initializing Empty List.\n", 114 | " \n", 115 | " def load(self, imagePaths, verbose=-1): # Defining Load Function. \n", 116 | " data, labels = [], [] # Initializing Empty List.\n", 117 | " for (i, imagePath) in enumerate(imagePaths):\n", 118 | " image = cv2.imread(imagePath) # Reading Image. \n", 119 | " label = imagePath.split(os.path.sep)[-2] # Getting Labels. 
\n", 120 | " if self.preprocessors is not None:\n", 121 | " for p in self.preprocessors:\n", 122 | " image = p.preprocess(image) # Preprocessing Image. \n", 123 | " data.append(image) # Updating Data. \n", 124 | " labels.append(label) # Updating Label. \n", 125 | " if verbose > 0 and i > 0 and (i+1)%verbose == 0:\n", 126 | " print(\"[INFO] processed {}/{}\".format(\n", 127 | " i + 1, len(imagePaths))) # Showing Updates. \n", 128 | " return (np.array(data), np.array(labels)) # Initializing Array of Data. " 129 | ], 130 | "execution_count": 4, 131 | "outputs": [] 132 | }, 133 | { 134 | "cell_type": "markdown", 135 | "metadata": { 136 | "id": "ewSTj0enq6PM" 137 | }, 138 | "source": [ 139 | "**K-NEAREST NEIGHBOR:**" 140 | ] 141 | }, 142 | { 143 | "cell_type": "code", 144 | "metadata": { 145 | "id": "y9x1Shb0sYg2" 146 | }, 147 | "source": [ 148 | "#@ GETTING DATASET: UNCOMMENT BELOW: \n", 149 | "# !unzip /content/drive/MyDrive/Data/animals.zip" 150 | ], 151 | "execution_count": 6, 152 | "outputs": [] 153 | }, 154 | { 155 | "cell_type": "code", 156 | "metadata": { 157 | "id": "CtUp594awpEO", 158 | "colab": { 159 | "base_uri": "https://localhost:8080/" 160 | }, 161 | "outputId": "b10b0fac-6de6-406f-b36a-ee3558e1a1a1" 162 | }, 163 | "source": [ 164 | "#@ PREPROCESSING DATASET: \n", 165 | "imagePaths = list(paths.list_images(\"/content/animals\")) # Getting Image Paths. \n", 166 | "sp = SimplePreprocessor(32, 32) # Initializing Image Resizing. \n", 167 | "sdl = SimpleDatasetLoader(preprocessors=[sp]) # Initializing Dataset Loader. \n", 168 | "(data, labels) = sdl.load(imagePaths, verbose=500) # Initializing Data and Labels. \n", 169 | "data = data.reshape((data.shape[0], 3072)) # Initializing Flatten. \n", 170 | "\n", 171 | "#@ ENCODING LABELS: \n", 172 | "le = LabelEncoder() # Initializing Label Encoder. \n", 173 | "labels = le.fit_transform(labels) # Encoding Labels as Integers. 
\n", 174 | "(trainX, testX, trainY, testY) = train_test_split(\n", 175 | " data, labels, test_size=0.25, random_state=42) # Initializing Training and Testing. \n", 176 | "\n", 177 | "#@ K-NEAREST NEIGHBOR ALGORITHMS: \n", 178 | "model = KNeighborsClassifier(n_neighbors=1, n_jobs=-1) # Initializing KNN Classifier. \n", 179 | "model.fit(trainX, trainY) # Training KNN Classifier. \n", 180 | "print(classification_report(testY, model.predict(testX), \n", 181 | " target_names=le.classes_)) # Inspecting Classification Report. " 182 | ], 183 | "execution_count": 8, 184 | "outputs": [ 185 | { 186 | "output_type": "stream", 187 | "name": "stdout", 188 | "text": [ 189 | "[INFO] processed 500/3000\n", 190 | "[INFO] processed 1000/3000\n", 191 | "[INFO] processed 1500/3000\n", 192 | "[INFO] processed 2000/3000\n", 193 | "[INFO] processed 2500/3000\n", 194 | "[INFO] processed 3000/3000\n", 195 | " precision recall f1-score support\n", 196 | "\n", 197 | " cats 0.41 0.53 0.46 249\n", 198 | " dogs 0.37 0.49 0.42 239\n", 199 | " panda 0.80 0.33 0.46 262\n", 200 | "\n", 201 | " accuracy 0.45 750\n", 202 | " macro avg 0.52 0.45 0.45 750\n", 203 | "weighted avg 0.53 0.45 0.45 750\n", 204 | "\n" 205 | ] 206 | } 207 | ] 208 | } 209 | ] 210 | } -------------------------------------------------------------------------------- /05. 
LeNet Architecture/LeNet.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "nbformat": 4, 3 | "nbformat_minor": 0, 4 | "metadata": { 5 | "colab": { 6 | "name": "LeNet.ipynb", 7 | "provenance": [], 8 | "collapsed_sections": [] 9 | }, 10 | "kernelspec": { 11 | "name": "python3", 12 | "display_name": "Python 3" 13 | }, 14 | "language_info": { 15 | "name": "python" 16 | }, 17 | "accelerator": "GPU" 18 | }, 19 | "cells": [ 20 | { 21 | "cell_type": "markdown", 22 | "source": [ 23 | "**INITIALIZATION:**\n", 24 | "- I use these three lines of code at the top of each of my notebooks because they help prevent problems when reloading the same project. The third line renders visualizations inline within the notebook." 25 | ], 26 | "metadata": { 27 | "id": "N1PzyssnEIti" 28 | } 29 | }, 30 | { 31 | "cell_type": "code", 32 | "execution_count": 1, 33 | "metadata": { 34 | "id": "1_wJNjd8DzuH" 35 | }, 36 | "outputs": [], 37 | "source": [ 38 | "#@ INITIALIZATION: \n", 39 | "%reload_ext autoreload\n", 40 | "%autoreload 2\n", 41 | "%matplotlib inline" 42 | ] 43 | }, 44 | { 45 | "cell_type": "markdown", 46 | "source": [ 47 | "**LIBRARIES AND DEPENDENCIES:**\n", 48 | "- I have imported all the libraries and dependencies required for the project in a single cell." 
49 | ], 50 | "metadata": { 51 | "id": "h-6DXIcJEc7v" 52 | } 53 | }, 54 | { 55 | "cell_type": "code", 56 | "source": [ 57 | "#@ IMPORTING NECESSARY LIBRARIES AND DEPENDENCIES:\n", 58 | "from keras.models import Sequential\n", 59 | "from keras.layers.convolutional import Conv2D\n", 60 | "from keras.layers.convolutional import MaxPooling2D\n", 61 | "from keras.layers.core import Activation\n", 62 | "from keras.layers.core import Flatten\n", 63 | "from keras.layers.core import Dense\n", 64 | "from keras import backend as K\n", 65 | "from tensorflow.keras.optimizers import SGD\n", 66 | "from tensorflow.keras.datasets import mnist\n", 67 | "\n", 68 | "from sklearn.preprocessing import LabelBinarizer\n", 69 | "from sklearn.model_selection import train_test_split\n", 70 | "from sklearn.metrics import classification_report\n", 71 | "\n", 72 | "import matplotlib.pyplot as plt\n", 73 | "import numpy as np" 74 | ], 75 | "metadata": { 76 | "id": "fckOv3DcEad3" 77 | }, 78 | "execution_count": 2, 79 | "outputs": [] 80 | }, 81 | { 82 | "cell_type": "markdown", 83 | "source": [ 84 | "**LENET ARCHITECTURE:**\n", 85 | "- I will define the build method of the **LeNet** architecture below. It requires four parameters: the **width** of the input image, the **height** of the input image, the **depth** of the image, and the number of **class labels** in the classification task. The **Sequential** class, the building block of sequential networks, stacks one layer on top of another; it is initialized below. " 86 | ], 87 | "metadata": { 88 | "id": "nQfvI-1YFaYo" 89 | } 90 | }, 91 | { 92 | "cell_type": "code", 93 | "source": [ 94 | "#@ DEFINING LENET ARCHITECTURE: \n", 95 | "class LeNet: # Defining LeNet Class. \n", 96 | " @staticmethod\n", 97 | " def build(width, height, depth, classes): # Defining Build Method. \n", 98 | " model = Sequential() # Initializing Sequential Model. \n", 99 | " inputShape = (height, width, depth) # Initializing Input Shape. 
\n", 100 | " if K.image_data_format() == \"channels_first\":\n", 101 | " inputShape = (depth, height, width) # Initializing Input Shape. \n", 102 | " model.add(Conv2D(20, (5, 5), padding=\"same\", \n", 103 | " input_shape=inputShape)) # Adding Convolutional Layer. \n", 104 | " model.add(Activation(\"relu\")) # Adding RELU Activation Function. \n", 105 | " model.add(MaxPooling2D(pool_size=(2,2),strides=(2,2))) # Decreasing 75% Input Size. \n", 106 | " model.add(Conv2D(50, (5, 5), padding=\"same\")) # Adding Convolutional Layer. \n", 107 | " model.add(Activation(\"relu\")) # Adding RELU Activation Function. \n", 108 | " model.add(MaxPooling2D(pool_size=(2,2),strides=(2,2))) # Decreasing 75% Input Size. \n", 109 | " model.add(Flatten()) # Adding Flatten Layer. \n", 110 | " model.add(Dense(500)) # Adding Fully Connected Layer. \n", 111 | " model.add(Activation(\"relu\")) # Adding RELU Activation Function. \n", 112 | " model.add(Dense(classes)) # Adding FC Dense Layer. \n", 113 | " model.add(Activation(\"softmax\")) # Adding Softmax Classifier. \n", 114 | " return model" 115 | ], 116 | "metadata": { 117 | "id": "bRzJKnSkFPO0" 118 | }, 119 | "execution_count": 3, 120 | "outputs": [] 121 | }, 122 | { 123 | "cell_type": "markdown", 124 | "source": [ 125 | "**LENET on MNIST:**\n", 126 | "- Each **MNIST** sample inside data is represented by a 784 dimensional raw pixel intensities of a 28X28 grayscale image. " 127 | ], 128 | "metadata": { 129 | "id": "WuUq9MJ4JhbA" 130 | } 131 | }, 132 | { 133 | "cell_type": "code", 134 | "source": [ 135 | "#@ GETTING THE DATASET: \n", 136 | "((trainData, trainLabels), (testData, testLabels)) = mnist.load_data() # Loading the Dataset. \n", 137 | "if K.image_data_format() == \"channels_first\":\n", 138 | " trainData = trainData.reshape((trainData.shape[0], 1, 28, 28)) # Reshaping the Dataset. \n", 139 | " testData = testData.reshape((testData.shape[0], 1, 28, 28)) # Reshaping the Dataset. 
\n", 140 | "else:\n", 141 | " trainData = trainData.reshape((trainData.shape[0], 28, 28, 1)) # Reshaping the Dataset. \n", 142 | " testData = testData.reshape((testData.shape[0], 28, 28, 1)) # Reshaping the Dataset. " 143 | ], 144 | "metadata": { 145 | "id": "3Xy_eCn7JV5q" 146 | }, 147 | "execution_count": 5, 148 | "outputs": [] 149 | }, 150 | { 151 | "cell_type": "code", 152 | "source": [ 153 | "#@ PROCESSING THE DATASET: \n", 154 | "trainData = trainData.astype('float32') / 255.0 # Normalizing the Data.\n", 155 | "testData = testData.astype('float32') / 255.0 # Normalizing the Data. \n", 156 | "lb = LabelBinarizer() # Initializing LabelBinarizer. \n", 157 | "trainLabels = lb.fit_transform(trainLabels) # Converting Labels into Vectors. \n", 158 | "testLabels = lb.transform(testLabels) # Converting Labels into Vectors. " 159 | ], 160 | "metadata": { 161 | "id": "WHXoDocPGa_0" 162 | }, 163 | "execution_count": 6, 164 | "outputs": [] 165 | }, 166 | { 167 | "cell_type": "code", 168 | "source": [ 169 | "#@ INITIALIZING OPTIMIZER AND MODEL: \n", 170 | "opt = SGD(0.01) # Initializing SGD Optimizer. \n", 171 | "model = LeNet.build(width=28, height=28, depth=1, classes=10) # Initializing LeNet Architecture. \n", 172 | "model.compile(loss=\"categorical_crossentropy\",optimizer=opt,\n", 173 | " metrics=[\"accuracy\"]) # Compiling LeNet Model. \n", 174 | "H = model.fit(trainData, trainLabels, \n", 175 | " validation_data=(testData, testLabels), \n", 176 | " batch_size=128, epochs=20, verbose=1) # Training LeNet Model." 
177 | ], 178 | "metadata": { 179 | "id": "DZ6N_dwXNnMS", 180 | "colab": { 181 | "base_uri": "https://localhost:8080/" 182 | }, 183 | "outputId": "73d12ac8-a931-45d1-e73e-f3a940606393" 184 | }, 185 | "execution_count": 7, 186 | "outputs": [ 187 | { 188 | "output_type": "stream", 189 | "name": "stdout", 190 | "text": [ 191 | "Epoch 1/20\n", 192 | "469/469 [==============================] - 18s 13ms/step - loss: 0.9274 - accuracy: 0.7520 - val_loss: 0.3026 - val_accuracy: 0.9131\n", 193 | "Epoch 2/20\n", 194 | "469/469 [==============================] - 6s 13ms/step - loss: 0.2503 - accuracy: 0.9264 - val_loss: 0.2037 - val_accuracy: 0.9403\n", 195 | "Epoch 3/20\n", 196 | "469/469 [==============================] - 6s 12ms/step - loss: 0.1784 - accuracy: 0.9476 - val_loss: 0.1571 - val_accuracy: 0.9520\n", 197 | "Epoch 4/20\n", 198 | "469/469 [==============================] - 6s 12ms/step - loss: 0.1387 - accuracy: 0.9593 - val_loss: 0.1278 - val_accuracy: 0.9603\n", 199 | "Epoch 5/20\n", 200 | "469/469 [==============================] - 6s 13ms/step - loss: 0.1154 - accuracy: 0.9658 - val_loss: 0.1032 - val_accuracy: 0.9665\n", 201 | "Epoch 6/20\n", 202 | "469/469 [==============================] - 6s 12ms/step - loss: 0.1002 - accuracy: 0.9700 - val_loss: 0.0854 - val_accuracy: 0.9734\n", 203 | "Epoch 7/20\n", 204 | "469/469 [==============================] - 6s 12ms/step - loss: 0.0882 - accuracy: 0.9741 - val_loss: 0.0756 - val_accuracy: 0.9773\n", 205 | "Epoch 8/20\n", 206 | "469/469 [==============================] - 6s 13ms/step - loss: 0.0784 - accuracy: 0.9764 - val_loss: 0.0705 - val_accuracy: 0.9768\n", 207 | "Epoch 9/20\n", 208 | "469/469 [==============================] - 6s 14ms/step - loss: 0.0715 - accuracy: 0.9787 - val_loss: 0.0677 - val_accuracy: 0.9782\n", 209 | "Epoch 10/20\n", 210 | "469/469 [==============================] - 6s 12ms/step - loss: 0.0663 - accuracy: 0.9801 - val_loss: 0.0647 - val_accuracy: 0.9796\n", 211 | "Epoch 11/20\n", 212 | 
"469/469 [==============================] - 6s 12ms/step - loss: 0.0614 - accuracy: 0.9819 - val_loss: 0.0551 - val_accuracy: 0.9815\n", 213 | "Epoch 12/20\n", 214 | "469/469 [==============================] - 6s 12ms/step - loss: 0.0575 - accuracy: 0.9830 - val_loss: 0.0568 - val_accuracy: 0.9817\n", 215 | "Epoch 13/20\n", 216 | "469/469 [==============================] - 6s 12ms/step - loss: 0.0543 - accuracy: 0.9836 - val_loss: 0.0512 - val_accuracy: 0.9832\n", 217 | "Epoch 14/20\n", 218 | "469/469 [==============================] - 6s 12ms/step - loss: 0.0511 - accuracy: 0.9845 - val_loss: 0.0500 - val_accuracy: 0.9831\n", 219 | "Epoch 15/20\n", 220 | "469/469 [==============================] - 6s 12ms/step - loss: 0.0482 - accuracy: 0.9856 - val_loss: 0.0497 - val_accuracy: 0.9830\n", 221 | "Epoch 16/20\n", 222 | "469/469 [==============================] - 6s 12ms/step - loss: 0.0462 - accuracy: 0.9860 - val_loss: 0.0599 - val_accuracy: 0.9801\n", 223 | "Epoch 17/20\n", 224 | "469/469 [==============================] - 5s 12ms/step - loss: 0.0442 - accuracy: 0.9868 - val_loss: 0.0435 - val_accuracy: 0.9863\n", 225 | "Epoch 18/20\n", 226 | "469/469 [==============================] - 5s 12ms/step - loss: 0.0422 - accuracy: 0.9875 - val_loss: 0.0421 - val_accuracy: 0.9860\n", 227 | "Epoch 19/20\n", 228 | "469/469 [==============================] - 6s 12ms/step - loss: 0.0404 - accuracy: 0.9876 - val_loss: 0.0418 - val_accuracy: 0.9863\n", 229 | "Epoch 20/20\n", 230 | "469/469 [==============================] - 6s 12ms/step - loss: 0.0390 - accuracy: 0.9880 - val_loss: 0.0398 - val_accuracy: 0.9868\n" 231 | ] 232 | } 233 | ] 234 | }, 235 | { 236 | "cell_type": "markdown", 237 | "source": [ 238 | "**MODEL EVALUATION:**" 239 | ], 240 | "metadata": { 241 | "id": "j1xxfT38dUyN" 242 | } 243 | }, 244 | { 245 | "cell_type": "code", 246 | "source": [ 247 | "#@ INITIALIZING MODEL EVALUATION:\n", 248 | "predictions = model.predict(testData, batch_size=128) # Getting Model 
Predictions. \n", 249 | "print(classification_report(testLabels.argmax(axis=1),\n", 250 | " predictions.argmax(axis=1), \n", 251 | " target_names=[str(x) for x in lb.classes_])) # Inspecting Classification Report." 252 | ], 253 | "metadata": { 254 | "colab": { 255 | "base_uri": "https://localhost:8080/" 256 | }, 257 | "id": "Wyd0nl4H92eJ", 258 | "outputId": "2c641006-f034-4fc8-f02a-474165307e0a" 259 | }, 260 | "execution_count": 8, 261 | "outputs": [ 262 | { 263 | "output_type": "stream", 264 | "name": "stdout", 265 | "text": [ 266 | " precision recall f1-score support\n", 267 | "\n", 268 | " 0 0.98 0.99 0.99 980\n", 269 | " 1 0.99 0.99 0.99 1135\n", 270 | " 2 0.99 0.98 0.99 1032\n", 271 | " 3 0.99 0.98 0.99 1010\n", 272 | " 4 0.99 0.99 0.99 982\n", 273 | " 5 0.99 0.99 0.99 892\n", 274 | " 6 0.99 0.99 0.99 958\n", 275 | " 7 0.98 0.99 0.98 1028\n", 276 | " 8 0.99 0.98 0.98 974\n", 277 | " 9 0.99 0.97 0.98 1009\n", 278 | "\n", 279 | " accuracy 0.99 10000\n", 280 | " macro avg 0.99 0.99 0.99 10000\n", 281 | "weighted avg 0.99 0.99 0.99 10000\n", 282 | "\n" 283 | ] 284 | } 285 | ] 286 | }, 287 | { 288 | "cell_type": "code", 289 | "source": [ 290 | "#@ INSPECTING TRAINING LOSS AND ACCURACY:\n", 291 | "plt.style.use(\"ggplot\")\n", 292 | "plt.figure()\n", 293 | "plt.plot(np.arange(0, 20), H.history[\"loss\"], label=\"train_loss\")\n", 294 | "plt.plot(np.arange(0, 20), H.history[\"val_loss\"], label=\"val_loss\")\n", 295 | "plt.plot(np.arange(0, 20), H.history[\"accuracy\"], label=\"train_acc\")\n", 296 | "plt.plot(np.arange(0, 20), H.history[\"val_accuracy\"], label=\"val_acc\")\n", 297 | "plt.title(\"Training Loss and Accuracy\")\n", 298 | "plt.xlabel(\"Epoch\")\n", 299 | "plt.ylabel(\"Loss/Accuracy\")\n", 300 | "plt.legend()\n", 301 | "plt.show();" 302 | ], 303 | "metadata": { 304 | "colab": { 305 | "base_uri": "https://localhost:8080/", 306 | "height": 299 307 | }, 308 | "id": "13nhXxfDdqWn", 309 | "outputId": "47275c65-aa57-423a-8654-81434ac95c79" 310 | }, 311 | 
"execution_count": 9, 312 | "outputs": [ 313 | { 314 | "output_type": "display_data", 315 | "data": { 316 | "image/png": "\n", 317 | "text/plain": [ 318 | "
" 319 | ] 320 | }, 321 | "metadata": {} 322 | } 323 | ] 324 | } 325 | ] 326 | } -------------------------------------------------------------------------------- /06. VGGNet Architecture/Mini VGGNet.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "nbformat": 4, 3 | "nbformat_minor": 0, 4 | "metadata": { 5 | "colab": { 6 | "name": "Mini VGGNet.ipynb", 7 | "provenance": [] 8 | }, 9 | "kernelspec": { 10 | "name": "python3", 11 | "display_name": "Python 3" 12 | }, 13 | "language_info": { 14 | "name": "python" 15 | }, 16 | "accelerator": "GPU" 17 | }, 18 | "cells": [ 19 | { 20 | "cell_type": "markdown", 21 | "source": [ 22 | "**INITIALIZATION:**\n", 23 | "- I use these three lines of code on top of my each notebooks because it will help to prevent any problems while reloading the same project. And the third line of code helps to make visualization within the notebook." 24 | ], 25 | "metadata": { 26 | "id": "5Vmy0mCIIvZy" 27 | } 28 | }, 29 | { 30 | "cell_type": "code", 31 | "execution_count": 1, 32 | "metadata": { 33 | "id": "5L3NmJeWFUEA" 34 | }, 35 | "outputs": [], 36 | "source": [ 37 | "#@ INITIALIZATION: \n", 38 | "%reload_ext autoreload\n", 39 | "%autoreload 2\n", 40 | "%matplotlib inline" 41 | ] 42 | }, 43 | { 44 | "cell_type": "markdown", 45 | "source": [ 46 | "**LIBRARIES AND DEPENDENCIES:**\n", 47 | "- I have downloaded all the libraries and dependencies required for the project in one particular cell." 
48 | ], 49 | "metadata": { 50 | "id": "tir9siflI3eF" 51 | } 52 | }, 53 | { 54 | "cell_type": "code", 55 | "source": [ 56 | "#@ IMPORTING NECESSARY LIBRARIES AND DEPENDENCIES:\n", 57 | "from keras.models import Sequential\n", 58 | "from keras.layers import BatchNormalization\n", 59 | "from keras.layers.convolutional import Conv2D\n", 60 | "from keras.layers.convolutional import MaxPooling2D\n", 61 | "from keras.layers.core import Activation\n", 62 | "from keras.layers.core import Flatten\n", 63 | "from keras.layers.core import Dense, Dropout\n", 64 | "from keras import backend as K\n", 65 | "from tensorflow.keras.optimizers import SGD\n", 66 | "from tensorflow.keras.datasets import cifar10\n", 67 | "from keras.callbacks import LearningRateScheduler\n", 68 | "\n", 69 | "from sklearn.preprocessing import LabelBinarizer\n", 70 | "from sklearn.model_selection import train_test_split\n", 71 | "from sklearn.metrics import classification_report\n", 72 | "\n", 73 | "import matplotlib.pyplot as plt\n", 74 | "import numpy as np" 75 | ], 76 | "metadata": { 77 | "id": "Bzk_8g75I05a" 78 | }, 79 | "execution_count": 3, 80 | "outputs": [] 81 | }, 82 | { 83 | "cell_type": "markdown", 84 | "source": [ 85 | "**VGG ARCHITECTURE:**\n", 86 | "- I will define the build method of the Mini VGGNet architecture below. It requires four parameters: the width of the input image, the height of the input image, the depth of the image, and the number of class labels in the classification task. The Sequential class, the building block of sequential networks, stacks one layer on top of another; it is initialized below. Batch Normalization operates over the channels, so in order to apply BN, we need to know which axis to normalize over. " 87 | ], 88 | "metadata": { 89 | "id": "5gbRFH9iLGKN" 90 | } 91 | }, 92 | { 93 | "cell_type": "code", 94 | "source": [ 95 | "#@ DEFINING VGGNET ARCHITECTURE:\n", 96 | "class MiniVGGNet: # Defining VGG Network. 
\n", 97 | " @staticmethod\n", 98 | " def build(width, height, depth, classes): # Defining Build Method. \n", 99 | " model = Sequential() # Initializing Sequential Model.\n", 100 | " inputShape = (width, height, depth) # Initializing Input Shape. \n", 101 | " chanDim = -1 # Index of Channel Dimension.\n", 102 | " if K.image_data_format() == \"channels_first\":\n", 103 | " inputShape = (depth, width, height) # Initializing Input Shape. \n", 104 | " chanDim = 1 # Index of Channel Dimension. \n", 105 | " model.add(Conv2D(32, (3, 3), padding='same', \n", 106 | " input_shape=inputShape)) # Adding Convolutional Layer. \n", 107 | " model.add(Activation(\"relu\")) # Adding RELU Activation Function. \n", 108 | " model.add(BatchNormalization(axis=chanDim)) # Adding Batch Normalization Layer. \n", 109 | " model.add(Conv2D(32, (3, 3), padding='same')) # Adding Convolutional Layer. \n", 110 | " model.add(Activation(\"relu\")) # Adding RELU Activation Function. \n", 111 | " model.add(BatchNormalization(axis=chanDim)) # Adding Batch Normalization Layer. \n", 112 | " model.add(MaxPooling2D(pool_size=(2, 2))) # Adding Max Pooling Layer. \n", 113 | " model.add(Dropout(0.25)) # Adding Dropout Layer.\n", 114 | " model.add(Conv2D(64, (3, 3), padding=\"same\")) # Adding Convolutional Layer. \n", 115 | " model.add(Activation(\"relu\")) # Adding RELU Activation Function. \n", 116 | " model.add(BatchNormalization(axis=chanDim)) # Adding Batch Normalization Layer. \n", 117 | " model.add(Conv2D(64, (3, 3), padding='same')) # Adding Convolutional Layer. \n", 118 | " model.add(Activation(\"relu\")) # Adding RELU Activation Function. \n", 119 | " model.add(BatchNormalization(axis=chanDim)) # Adding Batch Normalization Layer. \n", 120 | " model.add(MaxPooling2D(pool_size=(2, 2))) # Adding Max Pooling Layer. \n", 121 | " model.add(Dropout(0.25)) # Adding Dropout Layer. \n", 122 | " model.add(Flatten()) # Adding Flatten Layer. \n", 123 | " model.add(Dense(512)) # Adding FC Dense Layer. 
\n", 124 | " model.add(Activation(\"relu\")) # Adding Activation Layer. \n", 125 | " model.add(BatchNormalization()) # Adding Batch Normalization Layer. \n", 126 | " model.add(Dropout(0.5)) # Adding Dropout Layer. \n", 127 | " model.add(Dense(classes)) # Adding Dense Output Layer. \n", 128 | " model.add(Activation(\"softmax\")) # Adding Softmax Layer. \n", 129 | " return model" 130 | ], 131 | "metadata": { 132 | "id": "Ej2z0nJ-Kblr" 133 | }, 134 | "execution_count": 4, 135 | "outputs": [] 136 | }, 137 | { 138 | "cell_type": "code", 139 | "source": [ 140 | "#@ CUSTOM LEARNING RATE SCHEDULER: \n", 141 | "def step_decay(epoch): # Defining step decay function. \n", 142 | " initAlpha = 0.01 # Initializing initial LR.\n", 143 | " factor = 0.25 # Initializing drop factor. \n", 144 | " dropEvery = 5 # Initializing epochs to drop. \n", 145 | " alpha = initAlpha*(factor ** np.floor((1 + epoch) / dropEvery))\n", 146 | " return float(alpha)" 147 | ], 148 | "metadata": { 149 | "id": "KwzG_O1NlqVI" 150 | }, 151 | "execution_count": 6, 152 | "outputs": [] 153 | }, 154 | { 155 | "cell_type": "markdown", 156 | "source": [ 157 | "**VGGNET ON CIFAR10**" 158 | ], 159 | "metadata": { 160 | "id": "hNQiqb5gAlAU" 161 | } 162 | }, 163 | { 164 | "cell_type": "code", 165 | "source": [ 166 | "#@ GETTING THE DATASET:\n", 167 | "((trainX, trainY), (testX, testY)) = cifar10.load_data() # Loading Dataset. \n", 168 | "trainX = trainX.astype(\"float\") / 255.0 # Normalizing Dataset. \n", 169 | "testX = testX.astype(\"float\") / 255.0 # Normalizing Dataset. \n", 170 | "\n", 171 | "#@ PREPARING THE DATASET:\n", 172 | "lb = LabelBinarizer() # Initializing LabelBinarizer. \n", 173 | "trainY = lb.fit_transform(trainY) # Converting Labels to Vectors. \n", 174 | "testY = lb.transform(testY) # Converting Labels to Vectors. \n", 175 | "labelNames = [\"airplane\", \"automobile\", \"bird\", \"cat\", \"deer\", \n", 176 | " \"dog\", \"frog\", \"horse\", \"ship\", \"truck\"] # Initializing LabelNames." 
177 | ], 178 | "metadata": { 179 | "id": "z-EnWB4J-8kl" 180 | }, 181 | "execution_count": 7, 182 | "outputs": [] 183 | }, 184 | { 185 | "cell_type": "code", 186 | "source": [ 187 | "#@ INITIALIZING OPTIMIZER AND MODEL: \n", 188 | "callbacks = [LearningRateScheduler(step_decay)] # Initializing Callbacks. \n", 189 | "opt = SGD(0.01, nesterov=True, momentum=0.9) # Initializing SGD Optimizer. \n", 190 | "model = MiniVGGNet.build(width=32, height=32, depth=3, classes=10) # Initializing VGGNet Architecture. \n", 191 | "model.compile(loss=\"categorical_crossentropy\", optimizer=opt,\n", 192 | " metrics=[\"accuracy\"]) # Compiling VGGNet Model. \n", 193 | "H = model.fit(trainX, trainY, \n", 194 | " validation_data=(testX, testY), batch_size=64, \n", 195 | " epochs=40, verbose=1, callbacks=callbacks) # Training VGGNet Model." 196 | ], 197 | "metadata": { 198 | "colab": { 199 | "base_uri": "https://localhost:8080/" 200 | }, 201 | "id": "1lCPFWETBvgf", 202 | "outputId": "e1cdef1b-c28a-4e10-a935-5f602972acee" 203 | }, 204 | "execution_count": 8, 205 | "outputs": [ 206 | { 207 | "output_type": "stream", 208 | "name": "stdout", 209 | "text": [ 210 | "Epoch 1/40\n", 211 | "782/782 [==============================] - 29s 21ms/step - loss: 1.6339 - accuracy: 0.4555 - val_loss: 1.1509 - val_accuracy: 0.5970 - lr: 0.0100\n", 212 | "Epoch 2/40\n", 213 | "782/782 [==============================] - 16s 21ms/step - loss: 1.1813 - accuracy: 0.5932 - val_loss: 0.9222 - val_accuracy: 0.6733 - lr: 0.0100\n", 214 | "Epoch 3/40\n", 215 | "782/782 [==============================] - 16s 21ms/step - loss: 0.9908 - accuracy: 0.6567 - val_loss: 0.8341 - val_accuracy: 0.7159 - lr: 0.0100\n", 216 | "Epoch 4/40\n", 217 | "782/782 [==============================] - 16s 21ms/step - loss: 0.8854 - accuracy: 0.6945 - val_loss: 0.8282 - val_accuracy: 0.7167 - lr: 0.0100\n", 218 | "Epoch 5/40\n", 219 | "782/782 [==============================] - 16s 21ms/step - loss: 0.7380 - accuracy: 0.7421 - val_loss: 
0.6881 - val_accuracy: 0.7598 - lr: 0.0025\n", 220 | "Epoch 6/40\n", 221 | "782/782 [==============================] - 17s 21ms/step - loss: 0.6845 - accuracy: 0.7586 - val_loss: 0.6600 - val_accuracy: 0.7711 - lr: 0.0025\n", 222 | "Epoch 7/40\n", 223 | "782/782 [==============================] - 17s 21ms/step - loss: 0.6628 - accuracy: 0.7683 - val_loss: 0.6435 - val_accuracy: 0.7744 - lr: 0.0025\n", 224 | "Epoch 8/40\n", 225 | "782/782 [==============================] - 16s 21ms/step - loss: 0.6391 - accuracy: 0.7755 - val_loss: 0.6362 - val_accuracy: 0.7784 - lr: 0.0025\n", 226 | "Epoch 9/40\n", 227 | "782/782 [==============================] - 16s 21ms/step - loss: 0.6204 - accuracy: 0.7830 - val_loss: 0.6499 - val_accuracy: 0.7744 - lr: 0.0025\n", 228 | "Epoch 10/40\n", 229 | "782/782 [==============================] - 16s 21ms/step - loss: 0.5912 - accuracy: 0.7909 - val_loss: 0.6161 - val_accuracy: 0.7856 - lr: 6.2500e-04\n", 230 | "Epoch 11/40\n", 231 | "782/782 [==============================] - 16s 21ms/step - loss: 0.5812 - accuracy: 0.7936 - val_loss: 0.6054 - val_accuracy: 0.7879 - lr: 6.2500e-04\n", 232 | "Epoch 12/40\n", 233 | "782/782 [==============================] - 16s 21ms/step - loss: 0.5730 - accuracy: 0.7978 - val_loss: 0.5994 - val_accuracy: 0.7907 - lr: 6.2500e-04\n", 234 | "Epoch 13/40\n", 235 | "782/782 [==============================] - 16s 21ms/step - loss: 0.5698 - accuracy: 0.7974 - val_loss: 0.6013 - val_accuracy: 0.7882 - lr: 6.2500e-04\n", 236 | "Epoch 14/40\n", 237 | "782/782 [==============================] - 16s 21ms/step - loss: 0.5623 - accuracy: 0.8009 - val_loss: 0.5973 - val_accuracy: 0.7910 - lr: 6.2500e-04\n", 238 | "Epoch 15/40\n", 239 | "782/782 [==============================] - 16s 21ms/step - loss: 0.5496 - accuracy: 0.8064 - val_loss: 0.5961 - val_accuracy: 0.7905 - lr: 1.5625e-04\n", 240 | "Epoch 16/40\n", 241 | "782/782 [==============================] - 16s 21ms/step - loss: 0.5484 - accuracy: 0.8048 - val_loss: 
0.5937 - val_accuracy: 0.7914 - lr: 1.5625e-04\n", 242 | "Epoch 17/40\n", 243 | "782/782 [==============================] - 16s 21ms/step - loss: 0.5573 - accuracy: 0.8037 - val_loss: 0.5950 - val_accuracy: 0.7902 - lr: 1.5625e-04\n", 244 | "Epoch 18/40\n", 245 | "782/782 [==============================] - 16s 21ms/step - loss: 0.5477 - accuracy: 0.8062 - val_loss: 0.5927 - val_accuracy: 0.7907 - lr: 1.5625e-04\n", 246 | "Epoch 19/40\n", 247 | "782/782 [==============================] - 16s 21ms/step - loss: 0.5446 - accuracy: 0.8073 - val_loss: 0.5904 - val_accuracy: 0.7923 - lr: 1.5625e-04\n", 248 | "Epoch 20/40\n", 249 | "782/782 [==============================] - 16s 21ms/step - loss: 0.5391 - accuracy: 0.8104 - val_loss: 0.5926 - val_accuracy: 0.7920 - lr: 3.9062e-05\n", 250 | "Epoch 21/40\n", 251 | "782/782 [==============================] - 17s 21ms/step - loss: 0.5419 - accuracy: 0.8080 - val_loss: 0.5915 - val_accuracy: 0.7929 - lr: 3.9062e-05\n", 252 | "Epoch 22/40\n", 253 | "782/782 [==============================] - 16s 21ms/step - loss: 0.5438 - accuracy: 0.8099 - val_loss: 0.5909 - val_accuracy: 0.7925 - lr: 3.9062e-05\n", 254 | "Epoch 23/40\n", 255 | "782/782 [==============================] - 16s 21ms/step - loss: 0.5467 - accuracy: 0.8075 - val_loss: 0.5914 - val_accuracy: 0.7919 - lr: 3.9062e-05\n", 256 | "Epoch 24/40\n", 257 | "782/782 [==============================] - 16s 21ms/step - loss: 0.5376 - accuracy: 0.8103 - val_loss: 0.5918 - val_accuracy: 0.7920 - lr: 3.9062e-05\n", 258 | "Epoch 25/40\n", 259 | "782/782 [==============================] - 17s 21ms/step - loss: 0.5410 - accuracy: 0.8085 - val_loss: 0.5923 - val_accuracy: 0.7917 - lr: 9.7656e-06\n", 260 | "Epoch 26/40\n", 261 | "782/782 [==============================] - 17s 21ms/step - loss: 0.5406 - accuracy: 0.8084 - val_loss: 0.5910 - val_accuracy: 0.7915 - lr: 9.7656e-06\n", 262 | "Epoch 27/40\n", 263 | "782/782 [==============================] - 16s 21ms/step - loss: 0.5384 - 
accuracy: 0.8097 - val_loss: 0.5901 - val_accuracy: 0.7919 - lr: 9.7656e-06\n", 264 | "Epoch 28/40\n", 265 | "782/782 [==============================] - 16s 21ms/step - loss: 0.5431 - accuracy: 0.8089 - val_loss: 0.5915 - val_accuracy: 0.7927 - lr: 9.7656e-06\n", 266 | "Epoch 29/40\n", 267 | "782/782 [==============================] - 16s 21ms/step - loss: 0.5417 - accuracy: 0.8095 - val_loss: 0.5921 - val_accuracy: 0.7925 - lr: 9.7656e-06\n", 268 | "Epoch 30/40\n", 269 | "782/782 [==============================] - 17s 21ms/step - loss: 0.5385 - accuracy: 0.8108 - val_loss: 0.5900 - val_accuracy: 0.7926 - lr: 2.4414e-06\n", 270 | "Epoch 31/40\n", 271 | "782/782 [==============================] - 16s 21ms/step - loss: 0.5451 - accuracy: 0.8073 - val_loss: 0.5910 - val_accuracy: 0.7923 - lr: 2.4414e-06\n", 272 | "Epoch 32/40\n", 273 | "782/782 [==============================] - 16s 21ms/step - loss: 0.5402 - accuracy: 0.8103 - val_loss: 0.5899 - val_accuracy: 0.7925 - lr: 2.4414e-06\n", 274 | "Epoch 33/40\n", 275 | "782/782 [==============================] - 16s 21ms/step - loss: 0.5405 - accuracy: 0.8091 - val_loss: 0.5909 - val_accuracy: 0.7928 - lr: 2.4414e-06\n", 276 | "Epoch 34/40\n", 277 | "782/782 [==============================] - 16s 21ms/step - loss: 0.5427 - accuracy: 0.8091 - val_loss: 0.5914 - val_accuracy: 0.7921 - lr: 2.4414e-06\n", 278 | "Epoch 35/40\n", 279 | "782/782 [==============================] - 16s 21ms/step - loss: 0.5416 - accuracy: 0.8105 - val_loss: 0.5906 - val_accuracy: 0.7928 - lr: 6.1035e-07\n", 280 | "Epoch 36/40\n", 281 | "782/782 [==============================] - 16s 21ms/step - loss: 0.5375 - accuracy: 0.8109 - val_loss: 0.5905 - val_accuracy: 0.7927 - lr: 6.1035e-07\n", 282 | "Epoch 37/40\n", 283 | "782/782 [==============================] - 16s 21ms/step - loss: 0.5372 - accuracy: 0.8092 - val_loss: 0.5900 - val_accuracy: 0.7923 - lr: 6.1035e-07\n", 284 | "Epoch 38/40\n", 285 | "782/782 [==============================] - 16s 
21ms/step - loss: 0.5438 - accuracy: 0.8090 - val_loss: 0.5907 - val_accuracy: 0.7927 - lr: 6.1035e-07\n", 286 | "Epoch 39/40\n", 287 | "782/782 [==============================] - 16s 21ms/step - loss: 0.5424 - accuracy: 0.8097 - val_loss: 0.5906 - val_accuracy: 0.7922 - lr: 6.1035e-07\n", 288 | "Epoch 40/40\n", 289 | "782/782 [==============================] - 16s 21ms/step - loss: 0.5385 - accuracy: 0.8116 - val_loss: 0.5909 - val_accuracy: 0.7928 - lr: 1.5259e-07\n" 290 | ] 291 | } 292 | ] 293 | }, 294 | { 295 | "cell_type": "markdown", 296 | "source": [ 297 | "**MODEL EVALUATION:**" 298 | ], 299 | "metadata": { 300 | "id": "VYWybYDuELRf" 301 | } 302 | }, 303 | { 304 | "cell_type": "code", 305 | "source": [ 306 | "#@ INITIALIZING MODEL EVALUATION:\n", 307 | "predictions = model.predict(testX, batch_size=64) # Getting Model Predictions. \n", 308 | "print(classification_report(testY.argmax(axis=1),\n", 309 | " predictions.argmax(axis=1), \n", 310 | " target_names=labelNames)) # Inspecting Classification Report." 
311 | ], 312 | "metadata": { 313 | "colab": { 314 | "base_uri": "https://localhost:8080/" 315 | }, 316 | "id": "HZXqORsIDAtg", 317 | "outputId": "103704a3-ddf5-4503-eb09-cf1fc33fa3f3" 318 | }, 319 | "execution_count": 9, 320 | "outputs": [ 321 | { 322 | "output_type": "stream", 323 | "name": "stdout", 324 | "text": [ 325 | " precision recall f1-score support\n", 326 | "\n", 327 | " airplane 0.85 0.79 0.82 1000\n", 328 | " automobile 0.90 0.88 0.89 1000\n", 329 | " bird 0.73 0.65 0.69 1000\n", 330 | " cat 0.62 0.60 0.61 1000\n", 331 | " deer 0.72 0.81 0.76 1000\n", 332 | " dog 0.71 0.71 0.71 1000\n", 333 | " frog 0.80 0.89 0.84 1000\n", 334 | " horse 0.87 0.82 0.85 1000\n", 335 | " ship 0.89 0.89 0.89 1000\n", 336 | " truck 0.85 0.88 0.86 1000\n", 337 | "\n", 338 | " accuracy 0.79 10000\n", 339 | " macro avg 0.79 0.79 0.79 10000\n", 340 | "weighted avg 0.79 0.79 0.79 10000\n", 341 | "\n" 342 | ] 343 | } 344 | ] 345 | }, 346 | { 347 | "cell_type": "code", 348 | "source": [ 349 | "#@ INSPECTING TRAINING LOSS AND ACCURACY:\n", 350 | "plt.style.use(\"ggplot\")\n", 351 | "plt.figure()\n", 352 | "plt.plot(np.arange(0, 40), H.history[\"loss\"], label=\"train_loss\")\n", 353 | "plt.plot(np.arange(0, 40), H.history[\"val_loss\"], label=\"val_loss\")\n", 354 | "plt.plot(np.arange(0, 40), H.history[\"accuracy\"], label=\"train_acc\")\n", 355 | "plt.plot(np.arange(0, 40), H.history[\"val_accuracy\"], label=\"val_acc\")\n", 356 | "plt.title(\"Training Loss and Accuracy\")\n", 357 | "plt.xlabel(\"Epoch\")\n", 358 | "plt.ylabel(\"Loss/Accuracy\")\n", 359 | "plt.legend()\n", 360 | "plt.show();" 361 | ], 362 | "metadata": { 363 | "colab": { 364 | "base_uri": "https://localhost:8080/", 365 | "height": 299 366 | }, 367 | "id": "eCeJOSaJEdLC", 368 | "outputId": "779e2ecc-6ae8-4164-a170-6f5e8085df88" 369 | }, 370 | "execution_count": 10, 371 | "outputs": [ 372 | { 373 | "output_type": "display_data", 374 | "data": { 375 | "image/png": "\n", 376 | "text/plain": [ 377 | "
" 378 | ] 379 | }, 380 | "metadata": {} 381 | } 382 | ] 383 | }, 384 | { 385 | "cell_type": "markdown", 386 | "source": [ 387 | "**Note:**\n", 388 | "- Batch Normalization can lead to a faster, more stable convergence with higher accuracy. \n", 389 | "- Batch Normalization will require more wall time to train the network even though the network will obtain higher accuracy in less epochs. " 390 | ], 391 | "metadata": { 392 | "id": "cfm34boWToGw" 393 | } 394 | } 395 | ] 396 | } -------------------------------------------------------------------------------- /02. ConvolutionalNeuralNetworks/Convolutional Layers.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "nbformat": 4, 3 | "nbformat_minor": 0, 4 | "metadata": { 5 | "colab": { 6 | "name": "Convolutional Layers.ipynb", 7 | "provenance": [], 8 | "collapsed_sections": [] 9 | }, 10 | "kernelspec": { 11 | "name": "python3", 12 | "display_name": "Python 3" 13 | }, 14 | "language_info": { 15 | "name": "python" 16 | }, 17 | "accelerator": "GPU" 18 | }, 19 | "cells": [ 20 | { 21 | "cell_type": "markdown", 22 | "metadata": { 23 | "id": "zWddcLZPcLoU" 24 | }, 25 | "source": [ 26 | "**INITIALIZATION:**\n", 27 | "- I use these three lines of code on top of my each notebooks because it will help to prevent any problems while reloading the same project. And the third line of code helps to make visualization within the notebook." 
28 | ] 29 | }, 30 | { 31 | "cell_type": "code", 32 | "metadata": { 33 | "id": "It4XA2PkcBZo" 34 | }, 35 | "source": [ 36 | "#@ INITIALIZATION: \n", 37 | "%reload_ext autoreload\n", 38 | "%autoreload 2\n", 39 | "%matplotlib inline" 40 | ], 41 | "execution_count": 3, 42 | "outputs": [] 43 | }, 44 | { 45 | "cell_type": "markdown", 46 | "metadata": { 47 | "id": "aCoJ3nIxcSfk" 48 | }, 49 | "source": [ 50 | "**DOWNLOADING LIBRARIES AND DEPENDENCIES:**\n", 51 | "- I have downloaded all the libraries and dependencies required for the project in one particular cell." 52 | ] 53 | }, 54 | { 55 | "cell_type": "code", 56 | "metadata": { 57 | "id": "tARh3Gx3cPNy" 58 | }, 59 | "source": [ 60 | "#@ DOWNLOADING LIBRARIES AND DEPENDENCIES: \n", 61 | "import cv2\n", 62 | "import imutils\n", 63 | "import numpy as np\n", 64 | "from google.colab.patches import cv2_imshow\n", 65 | "\n", 66 | "from tensorflow.keras.models import Sequential\n", 67 | "from tensorflow.keras.layers import BatchNormalization\n", 68 | "from tensorflow.keras.layers import Conv2D\n", 69 | "from tensorflow.keras.layers import Activation\n", 70 | "from tensorflow.keras.layers import Flatten, Dropout\n", 71 | "from tensorflow.keras.layers import Dense \n", 72 | "from tensorflow.keras import backend as K\n", 73 | "\n", 74 | "from sklearn.preprocessing import LabelBinarizer\n", 75 | "from sklearn.model_selection import train_test_split\n", 76 | "from sklearn.metrics import classification_report\n", 77 | "from tensorflow.keras.preprocessing.image import ImageDataGenerator\n", 78 | "from tensorflow.keras.optimizers import Adam\n", 79 | "from tensorflow.keras.regularizers import l2\n", 80 | "from imutils import paths\n", 81 | "import matplotlib.pyplot as plt\n", 82 | "import os\n", 83 | "%matplotlib inline" 84 | ], 85 | "execution_count": 4, 86 | "outputs": [] 87 | }, 88 | { 89 | "cell_type": "markdown", 90 | "metadata": { 91 | "id": "XusQfVezcewl" 92 | }, 93 | "source": [ 94 | "**GETTING THE DATA:**\n", 95 | "- I will 
use a subset of the **CALTECH-101** dataset. " 96 | ] 97 | }, 98 | { 99 | "cell_type": "code", 100 | "metadata": { 101 | "id": "65FwRa6brfTa" 102 | }, 103 | "source": [ 104 | "#@ DOWNLOADING THE DATASET: UNCOMMENT BELOW: \n", 105 | "# !tar -zxvf \"/content/drive/MyDrive/Data/101_ObjectCategories.tar.gz\" -C \"/content/\"" 106 | ], 107 | "execution_count": 6, 108 | "outputs": [] 109 | }, 110 | { 111 | "cell_type": "markdown", 112 | "metadata": { 113 | "id": "sZokBKC10hEU" 114 | }, 115 | "source": [ 116 | "**STRIDED NET:** \n", 117 | "The **StridedNet** has the following important characteristics: \n", 118 | "- It uses strided convolutions rather than pooling operations to reduce volume size. \n", 119 | "- The first **Convolutional** layer uses 7X7 filters but all other layers in the network use 3X3 filters. \n", 120 | "- He normal initialization (`he_normal`, the default value of `init`) is used to initialize the weights of the convolutional layers and the hidden dense layer. " 121 | ] 122 | }, 123 | { 124 | "cell_type": "code", 125 | "metadata": { 126 | "id": "jHMU2OX1y9ze" 127 | }, 128 | "source": [ 129 | "#@ INITIALIZATION OF STRIDEDNET: \n", 130 | "class StridedNet: # Defining StridedNet Class. \n", 131 | " @staticmethod\n", 132 | " def build(width,height,depth,classes,reg,init=\"he_normal\"): # Defining Build Method. \n", 133 | " model = Sequential() # Initializing Sequential Model. \n", 134 | " inputShape = (height, width, depth) # Initializing Input Shape. \n", 135 | " chanDim = -1 # Initializing Channel. \n", 136 | " if K.image_data_format() == \"channels_first\": # Inspecting Data Format. \n", 137 | " inputShape = (depth, height, width) # Initializing Input Shape. \n", 138 | " chanDim = 1 # Initializing Channel. \n", 139 | " model.add(Conv2D(16,(7,7),strides=(2,2),padding=\"valid\",\n", 140 | " kernel_initializer=init,\n", 141 | " kernel_regularizer=reg,\n", 142 | " input_shape=inputShape)) # Initializing Convolutional Layer. 
\n", 143 | " model.add(Conv2D(32, (3,3), padding=\"same\", \n", 144 | " kernel_initializer=init,\n", 145 | " kernel_regularizer=reg)) # Initializing Convolutional Layer. \n", 146 | " model.add(Activation(\"relu\")) # Initializing Activation Function. \n", 147 | " model.add(BatchNormalization(axis=chanDim)) # Initializing BatchNormalization Layer. \n", 148 | " model.add(Conv2D(32, (3,3), strides=(2,2), padding=\"same\",\n", 149 | " kernel_initializer=init, \n", 150 | " kernel_regularizer=reg, \n", 151 | " activation=\"relu\")) # Initializing Convolutional Layer. \n", 152 | " model.add(BatchNormalization(axis=chanDim)) # Initializing BatchNormalization Layer.\n", 153 | " model.add(Dropout(0.25)) # Initializing Dropout Layer. \n", 154 | " model.add(Conv2D(64, (3,3), padding=\"same\", \n", 155 | " kernel_initializer=init, \n", 156 | " kernel_regularizer=reg)) # Initializing Convolutional Layer. \n", 157 | " model.add(Activation(\"relu\")) # Initializing Activation Function. \n", 158 | " model.add(BatchNormalization(axis=chanDim)) # Initializing BatchNormalization Layer.\n", 159 | " model.add(Conv2D(64, (3,3), strides=(2,2), padding=\"same\", \n", 160 | " kernel_initializer=init, \n", 161 | " kernel_regularizer=reg)) # Initializing Convolutional Layer. \n", 162 | " model.add(Activation(\"relu\")) # Initializing Activation Function.\n", 163 | " model.add(BatchNormalization(axis=chanDim)) # Initializing BatchNormalization Layer.\n", 164 | " model.add(Dropout(0.25)) # Initializing Dropout Layer.\n", 165 | " model.add(Conv2D(128, (3,3), padding=\"same\", \n", 166 | " kernel_initializer=init, \n", 167 | " kernel_regularizer=reg)) # Initializing Convolutional Layer. \n", 168 | " model.add(Activation(\"relu\")) # Initializing Activation Function. 
\n", 169 | " model.add(BatchNormalization(axis=chanDim)) # Initializing BatchNormalization Layer.\n", 170 | " model.add(Conv2D(128,(3,3), strides=(2,2), padding=\"same\", \n", 171 | " kernel_initializer=init, \n", 172 | " kernel_regularizer=reg)) # Initializing Convolutional Layer. \n", 173 | " model.add(Activation(\"relu\")) # Initializing Activation Function.\n", 174 | " model.add(BatchNormalization(axis=chanDim)) # Initializing BatchNormalization Layer.\n", 175 | " model.add(Dropout(0.25)) # Initializing Dropout Layer.\n", 176 | " model.add(Flatten()) # Initializing Fully Connected Layer. \n", 177 | " model.add(Dense(512, kernel_initializer=init)) # Initializing Dense Layer. \n", 178 | " model.add(Activation(\"relu\")) # Initializing Activation Function. \n", 179 | " model.add(BatchNormalization(axis=chanDim)) # Initializing BatchNormalization Layer.\n", 180 | " model.add(Dropout(0.5)) # Initializing Dropout Layer.\n", 181 | " model.add(Dense(classes, activation=\"softmax\")) # Initializing Dense Layer. \n", 182 | " return model" 183 | ], 184 | "execution_count": 7, 185 | "outputs": [] 186 | }, 187 | { 188 | "cell_type": "markdown", 189 | "metadata": { 190 | "id": "HaC43j2KXgqA" 191 | }, 192 | "source": [ 193 | "**PREPARING THE DATASET:**" 194 | ] 195 | }, 196 | { 197 | "cell_type": "code", 198 | "metadata": { 199 | "id": "HDK1a1jj_4Gh" 200 | }, 201 | "source": [ 202 | "#@ PREPARING THE DATASET: \n", 203 | "PATH = \"/content/101_ObjectCategories\" # Path to Dataset. \n", 204 | "LABELS = set([\"Faces\", \"Leopards\", \"Motorbikes\", \"airplanes\"]) # Initializing Labels. \n", 205 | "imagePaths = list(paths.list_images(PATH))\n", 206 | "data, labels = [], [] # Initializing List. \n", 207 | "\n", 208 | "#@ PREPARING THE DATASET: \n", 209 | "for imagePath in imagePaths:\n", 210 | " label = imagePath.split(os.path.sep)[-2] # Extracting Labels. \n", 211 | " if label not in LABELS: \n", 212 | " continue\n", 213 | " image = cv2.imread(imagePath) # Reading Image. 
\n", 214 | " image = cv2.resize(image, (96, 96)) # Resizing Image. \n", 215 | " data.append(image) # Updating Data. \n", 216 | " labels.append(label) # Updating Labels. " 217 | ], 218 | "execution_count": 8, 219 | "outputs": [] 220 | }, 221 | { 222 | "cell_type": "code", 223 | "metadata": { 224 | "id": "wo-EiZY3xLSe" 225 | }, 226 | "source": [ 227 | "#@ PREPARING THE DATASET: \n", 228 | "data = np.array(data, dtype=\"float\") / 255.0 # Converting into Array and Scaling. \n", 229 | "lb = LabelBinarizer() # Initializing Label Binarizer. \n", 230 | "labels = lb.fit_transform(labels) # Initializing One Hot Encoding. \n", 231 | "(trainX, testX, trainY, testY) = train_test_split(\n", 232 | " data,labels,test_size=0.25,stratify=labels,random_state=42) # Initializing Training and Test Dataset. \n", 233 | "aug = ImageDataGenerator(rotation_range=20, zoom_range=0.15, \n", 234 | " width_shift_range=0.2,\n", 235 | " height_shift_range=0.2,shear_range=0.15, \n", 236 | " horizontal_flip=True,fill_mode=\"nearest\") # Initializing Data Augmentation. " 237 | ], 238 | "execution_count": 9, 239 | "outputs": [] 240 | }, 241 | { 242 | "cell_type": "markdown", 243 | "metadata": { 244 | "id": "9mSdEjvTDQ9d" 245 | }, 246 | "source": [ 247 | "**TRAINING THE MODEL:**" 248 | ] 249 | }, 250 | { 251 | "cell_type": "code", 252 | "metadata": { 253 | "id": "39AQaVj5aUcu", 254 | "colab": { 255 | "base_uri": "https://localhost:8080/" 256 | }, 257 | "outputId": "216770fd-455e-4c9d-efd9-683e2b4ea699" 258 | }, 259 | "source": [ 260 | "#@ TRAINING THE MODEL: \n", 261 | "epochs = 50 # Initializing Epochs. \n", 262 | "opt = Adam(learning_rate=1e-4, decay=1e-4 / epochs) # Initializing Adam Optimizer. \n", 263 | "model = StridedNet.build(width=96, height=96, depth=3, \n", 264 | " classes=len(lb.classes_), reg=l2(0.0005)) # Initializing Model. \n", 265 | "model.compile(loss=\"categorical_crossentropy\", optimizer=opt, \n", 266 | " metrics=[\"accuracy\"]) # Compiling Model. 
\n", 267 | "H = model.fit(x=aug.flow(trainX, trainY, batch_size=32), \n", 268 | " validation_data=(testX, testY), \n", 269 | " steps_per_epoch=len(trainX) // 32, \n", 270 | " epochs=epochs) # Training Model. " 271 | ], 272 | "execution_count": 11, 273 | "outputs": [ 274 | { 275 | "output_type": "stream", 276 | "name": "stdout", 277 | "text": [ 278 | "Epoch 1/50\n", 279 | "52/52 [==============================] - 8s 118ms/step - loss: 1.8721 - accuracy: 0.5378 - val_loss: 2.1929 - val_accuracy: 0.4723\n", 280 | "Epoch 2/50\n", 281 | "52/52 [==============================] - 5s 99ms/step - loss: 1.4074 - accuracy: 0.6967 - val_loss: 1.3916 - val_accuracy: 0.7478\n", 282 | "Epoch 3/50\n", 283 | "52/52 [==============================] - 5s 99ms/step - loss: 1.2011 - accuracy: 0.7613 - val_loss: 1.5086 - val_accuracy: 0.7603\n", 284 | "Epoch 4/50\n", 285 | "52/52 [==============================] - 5s 97ms/step - loss: 1.1294 - accuracy: 0.7899 - val_loss: 1.3434 - val_accuracy: 0.8086\n", 286 | "Epoch 5/50\n", 287 | "52/52 [==============================] - 5s 101ms/step - loss: 1.0471 - accuracy: 0.8185 - val_loss: 1.3814 - val_accuracy: 0.7818\n", 288 | "Epoch 6/50\n", 289 | "52/52 [==============================] - 5s 103ms/step - loss: 1.0035 - accuracy: 0.8295 - val_loss: 1.0816 - val_accuracy: 0.8569\n", 290 | "Epoch 7/50\n", 291 | "52/52 [==============================] - 5s 104ms/step - loss: 0.9306 - accuracy: 0.8569 - val_loss: 0.9071 - val_accuracy: 0.8515\n", 292 | "Epoch 8/50\n", 293 | "52/52 [==============================] - 5s 103ms/step - loss: 0.9175 - accuracy: 0.8727 - val_loss: 0.6747 - val_accuracy: 0.9392\n", 294 | "Epoch 9/50\n", 295 | "52/52 [==============================] - 5s 102ms/step - loss: 0.8232 - accuracy: 0.8806 - val_loss: 0.7100 - val_accuracy: 0.9267\n", 296 | "Epoch 10/50\n", 297 | "52/52 [==============================] - 5s 101ms/step - loss: 0.8193 - accuracy: 0.8940 - val_loss: 0.6400 - val_accuracy: 0.9338\n", 298 | "Epoch 
11/50\n", 299 | "52/52 [==============================] - 5s 102ms/step - loss: 0.8255 - accuracy: 0.8855 - val_loss: 0.6565 - val_accuracy: 0.9302\n", 300 | "Epoch 12/50\n", 301 | "52/52 [==============================] - 5s 100ms/step - loss: 0.7882 - accuracy: 0.8989 - val_loss: 0.6087 - val_accuracy: 0.9463\n", 302 | "Epoch 13/50\n", 303 | "52/52 [==============================] - 5s 101ms/step - loss: 0.7551 - accuracy: 0.9068 - val_loss: 0.6028 - val_accuracy: 0.9481\n", 304 | "Epoch 14/50\n", 305 | "52/52 [==============================] - 5s 102ms/step - loss: 0.7456 - accuracy: 0.9086 - val_loss: 0.5935 - val_accuracy: 0.9481\n", 306 | "Epoch 15/50\n", 307 | "52/52 [==============================] - 5s 102ms/step - loss: 0.7786 - accuracy: 0.9032 - val_loss: 0.5897 - val_accuracy: 0.9463\n", 308 | "Epoch 16/50\n", 309 | "52/52 [==============================] - 5s 100ms/step - loss: 0.7307 - accuracy: 0.9093 - val_loss: 0.5597 - val_accuracy: 0.9624\n", 310 | "Epoch 17/50\n", 311 | "52/52 [==============================] - 5s 101ms/step - loss: 0.6842 - accuracy: 0.9275 - val_loss: 0.5633 - val_accuracy: 0.9517\n", 312 | "Epoch 18/50\n", 313 | "52/52 [==============================] - 5s 99ms/step - loss: 0.6784 - accuracy: 0.9348 - val_loss: 0.5626 - val_accuracy: 0.9606\n", 314 | "Epoch 19/50\n", 315 | "52/52 [==============================] - 5s 101ms/step - loss: 0.7007 - accuracy: 0.9245 - val_loss: 0.5427 - val_accuracy: 0.9624\n", 316 | "Epoch 20/50\n", 317 | "52/52 [==============================] - 5s 99ms/step - loss: 0.6692 - accuracy: 0.9348 - val_loss: 0.5800 - val_accuracy: 0.9606\n", 318 | "Epoch 21/50\n", 319 | "52/52 [==============================] - 5s 101ms/step - loss: 0.6413 - accuracy: 0.9379 - val_loss: 0.5528 - val_accuracy: 0.9642\n", 320 | "Epoch 22/50\n", 321 | "52/52 [==============================] - 5s 102ms/step - loss: 0.6770 - accuracy: 0.9275 - val_loss: 0.5635 - val_accuracy: 0.9606\n", 322 | "Epoch 23/50\n", 323 | 
"52/52 [==============================] - 5s 101ms/step - loss: 0.6708 - accuracy: 0.9269 - val_loss: 0.5434 - val_accuracy: 0.9660\n", 324 | "Epoch 24/50\n", 325 | "52/52 [==============================] - 5s 97ms/step - loss: 0.6763 - accuracy: 0.9330 - val_loss: 0.5592 - val_accuracy: 0.9678\n", 326 | "Epoch 25/50\n", 327 | "52/52 [==============================] - 5s 95ms/step - loss: 0.6246 - accuracy: 0.9519 - val_loss: 0.5451 - val_accuracy: 0.9678\n", 328 | "Epoch 26/50\n", 329 | "52/52 [==============================] - 5s 94ms/step - loss: 0.6277 - accuracy: 0.9440 - val_loss: 0.6080 - val_accuracy: 0.9445\n", 330 | "Epoch 27/50\n", 331 | "52/52 [==============================] - 5s 97ms/step - loss: 0.5871 - accuracy: 0.9586 - val_loss: 0.6347 - val_accuracy: 0.9338\n", 332 | "Epoch 28/50\n", 333 | "52/52 [==============================] - 5s 97ms/step - loss: 0.6126 - accuracy: 0.9507 - val_loss: 0.5435 - val_accuracy: 0.9732\n", 334 | "Epoch 29/50\n", 335 | "52/52 [==============================] - 5s 99ms/step - loss: 0.6244 - accuracy: 0.9452 - val_loss: 0.5588 - val_accuracy: 0.9660\n", 336 | "Epoch 30/50\n", 337 | "52/52 [==============================] - 5s 100ms/step - loss: 0.6009 - accuracy: 0.9507 - val_loss: 0.5706 - val_accuracy: 0.9571\n", 338 | "Epoch 31/50\n", 339 | "52/52 [==============================] - 5s 99ms/step - loss: 0.5958 - accuracy: 0.9476 - val_loss: 0.5693 - val_accuracy: 0.9642\n", 340 | "Epoch 32/50\n", 341 | "52/52 [==============================] - 5s 101ms/step - loss: 0.6220 - accuracy: 0.9434 - val_loss: 0.5970 - val_accuracy: 0.9517\n", 342 | "Epoch 33/50\n", 343 | "52/52 [==============================] - 5s 98ms/step - loss: 0.6160 - accuracy: 0.9513 - val_loss: 0.5614 - val_accuracy: 0.9517\n", 344 | "Epoch 34/50\n", 345 | "52/52 [==============================] - 5s 99ms/step - loss: 0.5862 - accuracy: 0.9519 - val_loss: 0.5357 - val_accuracy: 0.9732\n", 346 | "Epoch 35/50\n", 347 | "52/52 
[==============================] - 5s 99ms/step - loss: 0.5838 - accuracy: 0.9574 - val_loss: 0.5362 - val_accuracy: 0.9714\n", 348 | "Epoch 36/50\n", 349 | "52/52 [==============================] - 5s 101ms/step - loss: 0.5812 - accuracy: 0.9604 - val_loss: 0.5459 - val_accuracy: 0.9678\n", 350 | "Epoch 37/50\n", 351 | "52/52 [==============================] - 5s 102ms/step - loss: 0.5821 - accuracy: 0.9580 - val_loss: 0.5584 - val_accuracy: 0.9642\n", 352 | "Epoch 38/50\n", 353 | "52/52 [==============================] - 5s 101ms/step - loss: 0.5618 - accuracy: 0.9671 - val_loss: 0.5632 - val_accuracy: 0.9642\n", 354 | "Epoch 39/50\n", 355 | "52/52 [==============================] - 5s 100ms/step - loss: 0.5758 - accuracy: 0.9653 - val_loss: 0.5582 - val_accuracy: 0.9696\n", 356 | "Epoch 40/50\n", 357 | "52/52 [==============================] - 5s 99ms/step - loss: 0.5609 - accuracy: 0.9635 - val_loss: 0.5476 - val_accuracy: 0.9660\n", 358 | "Epoch 41/50\n", 359 | "52/52 [==============================] - 5s 98ms/step - loss: 0.5734 - accuracy: 0.9580 - val_loss: 0.5321 - val_accuracy: 0.9714\n", 360 | "Epoch 42/50\n", 361 | "52/52 [==============================] - 5s 99ms/step - loss: 0.5685 - accuracy: 0.9610 - val_loss: 0.5319 - val_accuracy: 0.9660\n", 362 | "Epoch 43/50\n", 363 | "52/52 [==============================] - 5s 99ms/step - loss: 0.5703 - accuracy: 0.9647 - val_loss: 0.5415 - val_accuracy: 0.9642\n", 364 | "Epoch 44/50\n", 365 | "52/52 [==============================] - 5s 100ms/step - loss: 0.5656 - accuracy: 0.9647 - val_loss: 0.6156 - val_accuracy: 0.9499\n", 366 | "Epoch 45/50\n", 367 | "52/52 [==============================] - 5s 99ms/step - loss: 0.5508 - accuracy: 0.9665 - val_loss: 0.5723 - val_accuracy: 0.9553\n", 368 | "Epoch 46/50\n", 369 | "52/52 [==============================] - 5s 100ms/step - loss: 0.5417 - accuracy: 0.9653 - val_loss: 0.5149 - val_accuracy: 0.9714\n", 370 | "Epoch 47/50\n", 371 | "52/52 
[==============================] - 5s 102ms/step - loss: 0.5463 - accuracy: 0.9683 - val_loss: 0.5333 - val_accuracy: 0.9678\n", 372 | "Epoch 48/50\n", 373 | "52/52 [==============================] - 5s 101ms/step - loss: 0.5394 - accuracy: 0.9742 - val_loss: 0.5494 - val_accuracy: 0.9642\n", 374 | "Epoch 49/50\n", 375 | "52/52 [==============================] - 5s 100ms/step - loss: 0.5433 - accuracy: 0.9702 - val_loss: 0.5362 - val_accuracy: 0.9660\n", 376 | "Epoch 50/50\n", 377 | "52/52 [==============================] - 5s 102ms/step - loss: 0.5608 - accuracy: 0.9653 - val_loss: 0.5225 - val_accuracy: 0.9785\n" 378 | ] 379 | } 380 | ] 381 | }, 382 | { 383 | "cell_type": "markdown", 384 | "metadata": { 385 | "id": "oAw1dFaKGDnU" 386 | }, 387 | "source": [ 388 | "**MODEL EVALUATION:**" 389 | ] 390 | }, 391 | { 392 | "cell_type": "code", 393 | "metadata": { 394 | "colab": { 395 | "base_uri": "https://localhost:8080/" 396 | }, 397 | "id": "D25QXmtsFzy3", 398 | "outputId": "b25a82ab-fe9c-4cea-cdbb-9a9360ab1fc0" 399 | }, 400 | "source": [ 401 | "#@ INITIALIZING MODEL EVALUATION: \n", 402 | "predictions = model.predict(testX, batch_size=32) # Initializing Predictions. \n", 403 | "print(classification_report(testY.argmax(axis=1), \n", 404 | " predictions.argmax(axis=1), \n", 405 | " target_names=lb.classes_)) # Inspecting Classification Report. 
" 406 | ], 407 | "execution_count": 12, 408 | "outputs": [ 409 | { 410 | "output_type": "stream", 411 | "name": "stdout", 412 | "text": [ 413 | " precision recall f1-score support\n", 414 | "\n", 415 | " Faces 0.96 0.99 0.97 109\n", 416 | " Leopards 0.96 0.88 0.92 50\n", 417 | " Motorbikes 0.98 0.99 0.99 200\n", 418 | " airplanes 0.99 0.98 0.99 200\n", 419 | "\n", 420 | " accuracy 0.98 559\n", 421 | " macro avg 0.97 0.96 0.97 559\n", 422 | "weighted avg 0.98 0.98 0.98 559\n", 423 | "\n" 424 | ] 425 | } 426 | ] 427 | }, 428 | { 429 | "cell_type": "code", 430 | "metadata": { 431 | "colab": { 432 | "base_uri": "https://localhost:8080/", 433 | "height": 299 434 | }, 435 | "id": "CZwb2iVtHHJD", 436 | "outputId": "3aca53d8-6013-4021-a2f2-8ca5be1b9130" 437 | }, 438 | "source": [ 439 | "#@ PLOTTING TRAINING LOSS AND ACCURACY: \n", 440 | "N = epochs \n", 441 | "plt.style.use(\"ggplot\")\n", 442 | "plt.figure()\n", 443 | "plt.plot(np.arange(0, N), H.history[\"loss\"], label=\"train_loss\")\n", 444 | "plt.plot(np.arange(0, N), H.history[\"val_loss\"], label=\"val_loss\")\n", 445 | "plt.plot(np.arange(0, N), H.history[\"accuracy\"], label=\"train_acc\")\n", 446 | "plt.plot(np.arange(0, N), H.history[\"val_accuracy\"], label=\"val_acc\")\n", 447 | "plt.title(\"Training Loss and Accuracy\")\n", 448 | "plt.xlabel(\"Epochs\")\n", 449 | "plt.ylabel(\"Loss/Accuracy\")\n", 450 | "plt.legend(loc=\"upper right\")\n", 451 | "plt.show();" 452 | ], 453 | "execution_count": 15, 454 | "outputs": [ 455 | { 456 | "output_type": "display_data", 457 | "data": { 458 | "image/png": "\n", 459 | "text/plain": [ 460 | "
" 461 | ] 462 | }, 463 | "metadata": {} 464 | } 465 | ] 466 | } 467 | ] 468 | } --------------------------------------------------------------------------------