├── Code.ipynb
├── README.md
├── d1-dataset-mri-and-d2-dataset-ct-scan.ipynb
├── drifa-net.ipynb
└── uncertainty-quantification-of-drifa-net.ipynb
/Code.ipynb:
--------------------------------------------------------------------------------
1 | {"metadata":{"kernelspec":{"language":"python","display_name":"Python 3","name":"python3"},"language_info":{"name":"python","version":"3.10.14","mimetype":"text/x-python","codemirror_mode":{"name":"ipython","version":3},"pygments_lexer":"ipython3","nbconvert_exporter":"python","file_extension":".py"},"kaggle":{"accelerator":"gpu","dataSources":[{"sourceId":1079953,"sourceType":"datasetVersion","datasetId":601280},{"sourceId":7957702,"sourceType":"datasetVersion","datasetId":4680825},{"sourceId":8031909,"sourceType":"datasetVersion","datasetId":4734294}],"dockerImageVersionId":30787,"isInternetEnabled":true,"language":"python","sourceType":"notebook","isGpuEnabled":true}},"nbformat_minor":4,"nbformat":4,"cells":[{"cell_type":"code","source":"import cv2\nimport seaborn as sns\nimport matplotlib.pyplot as plt\nimport numpy as np\nimport pandas as pd\nimport plotly.express as px\nsns.set_style('whitegrid')\nfrom sklearn.metrics import confusion_matrix , classification_report\nimport tensorflow as tf\nfrom tensorflow import keras\nfrom tensorflow.keras.models import Sequential\nfrom tensorflow.keras.layers import Dense , Flatten , Conv2D , MaxPooling2D , Dropout , Activation , BatchNormalization\nfrom tensorflow.keras.preprocessing.image import ImageDataGenerator\nfrom tensorflow.keras.optimizers import Adam , Adamax\nfrom tensorflow.keras import regularizers\n\n#Warnings\nimport warnings\nwarnings.filterwarnings('ignore')","metadata":{"_uuid":"8f2839f25d086af736a60e9eeb907d3b93b6e0e5","_cell_guid":"b1076dfc-b9ad-4769-8c92-a6c4dae69d19","trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"import tensorflow as tf\ntf.keras.mixed_precision.set_global_policy('mixed_float16')\n\nimport tensorflow as tf\nimport numpy as np\nimport numpy as np\nimport tensorflow as tf\nfrom tensorflow.keras.layers import Input, Conv2D, MaxPooling2D, Flatten, Dense, Dropout, GlobalAveragePooling2D, BatchNormalization, ReLU, Add\nfrom tensorflow.keras.models import Model\nfrom tensorflow.keras.losses import KLDivergence\nfrom tensorflow.keras.callbacks import ModelCheckpoint, EarlyStopping\nfrom tensorflow.keras.utils import to_categorical\nfrom tensorflow.keras.datasets import cifar10\nfrom tensorflow.keras.applications import EfficientNetB0\nfrom tensorflow.keras.applications import DenseNet121, ResNet50V2\nfrom tensorflow.keras.layers import GlobalAveragePooling2D\nimport copy\nimport numpy as np\nimport tensorflow as tf\nfrom tensorflow.keras.layers import Input, Conv2D, MaxPooling2D, Flatten, Dense, Dropout, GlobalAveragePooling2D, BatchNormalization, ReLU, Add\nfrom tensorflow.keras.models import Model\nfrom tensorflow.keras.losses import KLDivergence\nfrom tensorflow.keras.callbacks import ModelCheckpoint, EarlyStopping\nfrom tensorflow.keras.utils import to_categorical\nfrom tensorflow.keras.datasets import cifar10\nfrom tensorflow.keras.applications import EfficientNetB0\nfrom tensorflow.keras.applications import DenseNet169, MobileNetV2, ResNet50, EfficientNetB0\nfrom tensorflow.keras.layers import GlobalAveragePooling2D\nimport copy\n\nimport tensorflow as tf\nfrom tensorflow.keras import layers\nimport tensorflow as tf\nfrom tensorflow.keras import layers\n","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"X_train_h = np.load('X_train_HAM10000_ISIC_2018.npy')\ny_train_h = np.load('y_train_HAM10000_ISIC_2018.npy')\nX_test_h = np.load('X_test_HAM10000_ISIC_2018.npy')\ny_test_h = np.load('y_test_HAM10000_ISIC_2018.npy')\n\n\nX_train_h.shape, y_train_h.shape, X_test_h.shape, y_test_h.shape\n","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"random_indices = np.random.choice(2003, 810, replace=False)\n\nX_test_h1 = X_test_h[random_indices]\ny_test_h1 = y_test_h[random_indices]\n\nX_test_h1.shape, y_test_h1.shape, X_test_h.shape, y_test_h.shape","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"#X_train_s.shape,X_test_s.shape, y_train_s.shape,y_test_s.shape","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"X_train_h.shape, y_train_h.shape, X_test_h.shape, y_test_h.shape","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"X_train_s = np.load('/kaggle/input/spikamed-ds/data_cervical_cancer_sipkamed.npy')\ny_train_s = np.load('/kaggle/input/spikamed-ds/labels_cervical_cancer_sipkamed.npy')\n\nX_train_s.shape, y_train_s.shape","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"from sklearn.model_selection import train_test_split\n\nX_train_s, X_test_s, y_train_s, y_test_s = train_test_split(X_train_s, y_train_s, test_size=0.2, random_state=42)\n\nX_train_s.shape,X_test_s.shape, y_train_s.shape,y_test_s.shape","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"import numpy as np\nimport cv2\n\ndef rotate_image(image, angle):\n \"\"\"\n Rotate the image by the specified angle.\n \"\"\"\n center = tuple(np.array(image.shape[1::-1]) / 2)\n rotation_matrix = cv2.getRotationMatrix2D(center, angle, 1.0)\n rotated_image = cv2.warpAffine(image, rotation_matrix, image.shape[1::-1], flags=cv2.INTER_LINEAR)\n return rotated_image\n\ndef translate_image(image, tx, ty):\n \"\"\"\n Translate the image by the specified translation parameters.\n \"\"\"\n translation_matrix = np.float32([[1, 0, tx], [0, 1, ty]])\n translated_image = cv2.warpAffine(image, translation_matrix, image.shape[1::-1])\n return translated_image\n\n# Example data\n#X_train = np.random.rand(100, 28, 28) # Assuming 100 images of size 28x28\n#y_train = np.random.randint(0, 10, 100) # Assuming 100 labels\n\n# Augmentation parameters\nrotation_angles = [20]\ntranslations = [(5, 5)]\n\naugmented_X_train = []\naugmented_y_train = []\n\nfor image, label in zip(X_train_s, y_train_s):\n # Original image\n #augmented_X_train.append(image)\n #augmented_y_train.append(label)\n\n # Augment with rotations\n for angle in rotation_angles:\n rotated_image = rotate_image(image, angle)\n augmented_X_train.append(rotated_image)\n augmented_y_train.append(label)\n\n # Augment with translations\n for tx, ty in translations:\n translated_image = translate_image(image, tx, ty)\n augmented_X_train.append(translated_image)\n augmented_y_train.append(label)\n\n# Convert lists to numpy arrays\naugmented_X_train = np.array(augmented_X_train)\naugmented_y_train = np.array(augmented_y_train)\n\n# Shuffle the data\nshuffle_indices = np.random.permutation(len(augmented_X_train))\naugmented_X_train = augmented_X_train[shuffle_indices]\naugmented_y_train = augmented_y_train[shuffle_indices]\naugmented_X_train.shape, augmented_y_train.shape\n# Now, augmented_X_train and augmented_y_train contain the augmented dataset.","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"random_indices = np.random.choice(6478, 4773, replace=False)\n\naugmented_X_train = augmented_X_train[random_indices]\naugmented_y_train = augmented_y_train[random_indices]\n\naugmented_X_train.shape, augmented_y_train.shape\n","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"X_train_s = np.concatenate((X_train_s, augmented_X_train), axis=0)\ny_train_s = np.concatenate((y_train_s, augmented_y_train), axis=0)\nX_train_s.shape, y_train_s.shape","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"'''X_train_s = np.concatenate((X_train_s, X_train_s, X_train_s), axis=0)\ny_train_s = np.concatenate((y_train_s, y_train_s, y_train_s), axis=0)\nX_train_s.shape, y_train_s.shape'''","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"X_test_s1 = np.concatenate((X_test_s, X_test_s, X_test_s), axis=0)\ny_test_s1 = np.concatenate((y_test_s, y_test_s, y_test_s), axis=0)\nX_test_s1.shape, y_test_s1.shape","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"X_train_s.shape, y_train_s.shape","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"augmented_X_train.shape, augmented_y_train.shape","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"random_indices = np.random.choice(2430, 2003, replace=False)\n\nX_test_s1 = X_test_s1[random_indices]\ny_test_s1 = y_test_s1[random_indices]\n\nX_test_s1.shape, y_test_s1.shape, X_test_s.shape, y_test_s.shape","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"#X_train.shape, y_train.shape, X_test.shape, y_test.shape, \nX_train_s.shape,X_test_s.shape, y_train_s.shape,y_test_s.shape, X_test_s1.shape, y_test_s1.shape","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"print(X_train_h.shape, y_train_h.shape, X_test_h.shape, y_test_h.shape,\n#X_train.shape, y_train.shape, X_test.shape, y_test.shape,\nX_train_s.shape,X_test_s.shape, X_test_s1.shape, y_train_s.shape,y_test_s.shape, y_test_s1.shape)","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"markdown","source":"**Multi-branch fusion attention (MFA) module**","metadata":{}},{"cell_type":"code","source":"#### Multi-branch fusion attention (MFA) module #####\n\nclass DeeperGlobalLocalAttentionLayer1(layers.Layer):\n def __init__(self, units, activation='sigmoid', dropout_rate=0.2, use_scale=True, axis=-1, **kwargs):\n super(DeeperGlobalLocalAttentionLayer1, self).__init__(**kwargs)\n self.units = units\n self.activation = activation\n self.dropout_rate = dropout_rate\n self.use_scale = use_scale\n self.axis = axis\n\n def build(self, input_shape):\n _, _, _, channels = input_shape\n self.global_conv1 = layers.Conv2D(filters=self.units, kernel_size=(1, 1), activation=self.activation)\n self.global_avg_pooling1 = layers.GlobalAveragePooling2D()\n \n self.global_conv2 = layers.Conv2D(filters=self.units, kernel_size=(1, 1), activation=self.activation)\n self.global_avg_pooling2 = layers.GlobalMaxPooling2D()\n \n self.global_conv3 = layers.Conv2D(filters=self.units, kernel_size=(1, 1), activation=self.activation)\n self.global_avg_pooling3 = layers.GlobalAveragePooling2D()\n \n self.global_conv4 = layers.Conv2D(filters=self.units, kernel_size=(1, 1), activation=self.activation)\n self.global_avg_pooling4 = layers.GlobalMaxPooling2D()\n \n self.concat1 = layers.Add()\n self.concat2 = layers.Add()\n self.concat3 = layers.Add()\n self.concat4 = layers.Add()\n self.concat5 = layers.Concatenate(axis=-1)\n \n self.global_attention = layers.Dense(units=self.units, activation=self.activation)\n \n self.local_conv1 = layers.Conv2D(filters=self.units, kernel_size=(1, 1), activation=self.activation)\n self.local_conv2 = layers.Conv2D(filters=self.units, kernel_size=(1, 1), activation=self.activation)\n self.concat6 = layers.Add()\n \n if self.use_scale:\n self.global_scale = self.add_weight(shape=(1, 1, 1, 1), initializer='ones', trainable=True, name='global_scale')\n self.local_scale = self.add_weight(shape=(1, 1, 1, self.units), initializer='ones', trainable=True, name='local_scale')\n \n super(DeeperGlobalLocalAttentionLayer1, self).build(input_shape)\n\n def call(self, inputs, training=None):\n ##### Hierarchical Information Fusion Attention(HIFA) ######\n \n global_attention1 = self.global_conv1(inputs)\n global_avg1 = self.global_avg_pooling1(global_attention1)\n \n global_attention2 = self.global_conv2(global_attention1)\n global_avg2 = self.global_avg_pooling2(global_attention2)\n \n global_concat1 = self.concat1([global_avg1, global_avg2])\n global_attention_concat1 = self.concat2([global_attention1, global_attention2])\n \n global_attention3 = self.global_conv3(global_attention_concat1)\n global_avg3 = self.global_avg_pooling3(global_attention3)\n \n global_attention4 = self.global_conv4(global_attention3)\n global_avg4 = self.global_avg_pooling4(global_attention4)\n \n global_concat2 = self.concat3([global_avg3, global_avg4])\n global_attention_concat2 = self.concat4([global_attention3, global_attention4])\n \n global_avg_concat = self.concat5([global_concat1, global_concat2])\n \n global_attention = self.global_attention(global_avg_concat)\n global_attention = tf.expand_dims(tf.expand_dims(global_attention, 1), 1)\n\n ##### Channel-wise Local Information Attention (CLIA) ######\n \n local_attention1 = self.local_conv1(inputs)\n local_attention1 = tf.reduce_mean(local_attention1, axis=[1, 2], keepdims=True) # Reduce spatial dimensions\n local_attention2 = self.local_conv2(local_attention1)\n local_attention2 = tf.reduce_mean(local_attention2, axis=[1, 2], keepdims=True) # Reduce spatial dimensions\n \n local_attention = self.concat6([local_attention1, local_attention2])\n \n # Scale Global and Local Attention\n if self.use_scale:\n global_attention *= self.global_scale\n local_attention *= self.local_scale\n\n # Combine Global and Local Attention\n attention = tf.sigmoid(global_attention + local_attention)\n return attention\n\n def get_config(self):\n config = super(DeeperGlobalLocalAttentionLayer1, self).get_config()\n config.update({'units': self.units, 'activation': self.activation, 'dropout_rate': self.dropout_rate,\n 'use_scale': self.use_scale})\n return config\n\nclass DeeperAttentionLayer1(layers.Layer):\n def __init__(self, units=64, use_scale=True, **kwargs):\n super(DeeperAttentionLayer1, self).__init__(**kwargs)\n self.units = units\n self.use_scale = use_scale\n\n def build(self, input_shape):\n _, H, W, C = input_shape\n self.alpha = self.add_weight(shape=(1, 1, 1, C), initializer='ones', trainable=True, name='alpha')\n self.deeper_global_local_attention = DeeperGlobalLocalAttentionLayer1(units=self.units, activation='sigmoid', \n dropout_rate=0.2, # You can adjust the dropout rate\n use_scale=self.use_scale)\n super(DeeperAttentionLayer1, self).build(input_shape)\n\n def call(self, inputs, training=None):\n attention = self.deeper_global_local_attention(inputs, training=training)\n attention_feature = inputs * attention * self.alpha\n return attention_feature\n\n def get_config(self):\n config = super(DeeperAttentionLayer1, self).get_config()\n config.update({'units': self.units, 'use_scale': self.use_scale})\n return config\n","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"markdown","source":"**Multimodal information fusion attention (MIFA)**","metadata":{}},{"cell_type":"code","source":"########## Multimodal information fusion attention (MIFA) ###############\n\n\n\nclass GlobalMinPooling2D(layers.Layer):\n def __init__(self, **kwargs):\n super(GlobalMinPooling2D, self).__init__(**kwargs)\n\n def call(self, inputs):\n return tf.reduce_min(inputs, axis=[1, 2])\n\n def compute_output_shape(self, input_shape):\n return (input_shape[0], input_shape[-1])\n\n def get_config(self):\n config = super(GlobalMinPooling2D, self).get_config()\n return config\n\n\nclass DeeperGlobalLocalAttentionLayer(layers.Layer):\n def __init__(self, units, activation='sigmoid', dropout_rate=0.2, use_scale=True, axis=-1, **kwargs):\n super(DeeperGlobalLocalAttentionLayer, self).__init__(**kwargs)\n self.units = units\n self.activation = activation\n self.dropout_rate = dropout_rate\n self.use_scale = use_scale\n self.axis = axis\n\n def build(self, input_shapes):\n input_shape1, input_shape2 = input_shapes\n _, _, _, channels1 = input_shape1\n _, _, _, channels2 = input_shape2\n \n self.global_min_pooling1 = GlobalMinPooling2D()\n self.global_avg_pooling1 = layers.GlobalAveragePooling2D()\n self.global_max_pooling1 = layers.GlobalMaxPooling2D()\n \n self.global_attention = layers.Dense(units=self.units, activation=self.activation)\n \n self.global_min_pooling2 = GlobalMinPooling2D()\n self.global_avg_pooling2 = layers.GlobalAveragePooling2D()\n self.global_max_pooling2 = layers.GlobalMaxPooling2D()\n \n #self.global_attention2 = layers.Dense(units=self.units, activation=self.activation)\n \n \n self.concat = layers.Add()\n #self.global_attention3 = layers.Dense(units=self.units, activation=self.activation)\n \n self.local_conv1 = layers.Conv2D(filters=self.units, kernel_size=(1, 1), activation=self.activation)\n self.local_conv2 = layers.Conv2D(filters=self.units, kernel_size=(1, 1), activation=self.activation)\n \n \n \n self.concat2 = layers.Add()\n #self.local_conv5 = layers.Conv2D(filters=self.units, kernel_size=(1, 1), activation=self.activation)\n \n if self.use_scale:\n self.global_scale = self.add_weight(shape=(1, 1, 1, 1), initializer='ones', trainable=True, name='global_scale')\n self.local_scale = self.add_weight(shape=(1, 1, 1, self.units), initializer='ones', trainable=True, name='local_scale')\n \n super(DeeperGlobalLocalAttentionLayer, self).build(input_shapes)\n\n def call(self, inputs, training=None):\n inputs1, inputs2 = inputs\n\n ######### Multimodal Global Information Fusion Attention (MGIFA) #########\n global_min1 = self.global_min_pooling1(inputs1)\n global_avg1 = self.global_avg_pooling1(inputs1)\n global_max1 = self.global_max_pooling1(inputs1)\n\n global_min2 = self.global_min_pooling2(inputs2)\n global_avg2 = self.global_avg_pooling2(inputs2)\n global_max2 = self.global_max_pooling2(inputs2)\n\n concat_min = self.concat([global_min1, global_min2])\n concat_avg = self.concat([global_avg1, global_avg2])\n concat_max = self.concat([global_max1, global_max2])\n \n concat_min = self.global_attention(concat_min)\n concat_avg = self.global_attention(concat_avg)\n concat_max = self.global_attention(concat_max)\n \n concat_global_attention = self.concat([concat_min, concat_avg, concat_max])\n \n #global_attention = self.global_attention3(concat_global_attention)\n \n global_attention = tf.expand_dims(tf.expand_dims(concat_global_attention, 1), 1)\n\n ######### Multimodal Local Information Fusion Attention (MLIFA) #########\n \n local_conv1 = self.local_conv1(inputs1)\n local_min1 = tf.reduce_min(local_conv1, axis=[1, 2], keepdims=True) # Reduce spatial dimensions\n local_avg1 = tf.reduce_mean(local_conv1, axis=[1, 2], keepdims=True) # Reduce spatial dimensions\n local_max1 = tf.reduce_max(local_conv1, axis=[1, 2], keepdims=True) # Reduce spatial dimensions\n \n local_conv2 = self.local_conv2(inputs2)\n local_min2 = tf.reduce_min(local_conv2, axis=[1, 2], keepdims=True) # Reduce spatial dimensions\n local_avg2 = tf.reduce_mean(local_conv2, axis=[1, 2], keepdims=True) # Reduce spatial dimensions\n local_max2 = tf.reduce_max(local_conv2, axis=[1, 2], keepdims=True) # Reduce spatial dimensions\n \n local_concat_min = self.concat2([local_min1, local_min2])\n local_concat_avg = self.concat2([local_avg1, local_avg2])\n local_concat_max = self.concat2([local_max1, local_max2])\n\n local_attention = self.concat2([local_concat_min, local_concat_avg, local_concat_max])\n \n \n # Scale Global and Local Attention\n if self.use_scale:\n global_attention *= self.global_scale\n local_attention *= self.local_scale\n\n # Combine Global and Local Attention\n attention = tf.sigmoid(global_attention + local_attention)\n return attention\n\n def get_config(self):\n config = super(DeeperGlobalLocalAttentionLayer, self).get_config()\n config.update({'units': self.units, 'activation': self.activation, 'dropout_rate': self.dropout_rate,\n 'use_scale': self.use_scale})\n return config\n\nclass DeeperAttentionLayer(layers.Layer):\n def __init__(self, units=64, use_scale=True,axis=-1, **kwargs):\n super(DeeperAttentionLayer, self).__init__(**kwargs)\n self.units = units\n self.use_scale = use_scale\n self.axis = axis \n\n def build(self, input_shapes):\n input_shape1, input_shape2 = input_shapes\n _, H, W, C1 = input_shape1\n _, H, W, C2 = input_shape2\n \n self.alpha1 = self.add_weight(shape=(1, 1, 1, C1), initializer='ones', trainable=True, name='alpha1')\n self.alpha2 = self.add_weight(shape=(1, 1, 1, C2), initializer='ones', trainable=True, name='alpha2')\n \n self.deeper_global_local_attention = DeeperGlobalLocalAttentionLayer(units=self.units, activation='sigmoid', \n dropout_rate=0.2, # You can adjust the dropout rate\n use_scale=self.use_scale)\n #self.concat3 = layers.Add()\n #self.concat4 = layers.Add()\n \n super(DeeperAttentionLayer, self).build(input_shapes)\n\n def call(self, inputs, training=None):\n inputs1, inputs2 = inputs\n attention = self.deeper_global_local_attention([inputs1, inputs2], training=training)\n \n #inputs_concat = self.concat3([inputs1, inputs2])\n #alpha_concat = self.concat4([self.alpha1, self.alpha2])\n \n attention_feature1 = inputs1 * attention * self.alpha1\n attention_feature2 = inputs2 * attention * self.alpha2\n \n return attention_feature1, attention_feature2\n\n def get_config(self):\n config = super(DeeperAttentionLayer, self).get_config()\n config.update({'units': self.units, 'use_scale': self.use_scale})\n return config\n","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"### RRA block ########\n\ndef RGSA(x, filters, strides=(1, 1), use_projection=False):\n shortcut = x\n\n # Define the first convolutional layer of the block\n \n x = Conv2D(filters=filters, kernel_size=(3, 3), strides=strides, padding='same', \n #activation = 'relu'\n\n )(x)\n x = DeeperAttentionLayer1(units=filters, use_scale=True)(x)\n x = BatchNormalization()(x)\n x = tf.keras.layers.Activation('relu')(x)\n\n # Define the second convolutional layer of the block\n \n x = Conv2D(filters=filters, kernel_size=(3, 3), padding='same')(x)\n x = DeeperAttentionLayer1(units=filters, use_scale=True)(x)\n \n x = BatchNormalization()(x)\n\n # If the stride is not (1, 1), the dimensions need to be adjusted\n if strides != (1, 1) or use_projection:\n \n shortcut = Conv2D(filters=filters, kernel_size=(1, 1), strides=strides, padding='same')(shortcut)\n shortcut = BatchNormalization()(shortcut)\n\n # Add the shortcut (identity connection)\n \n x = tf.keras.layers.add([x, shortcut])\n \n x = tf.keras.layers.Activation('relu')(x)\n return x\n","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"def residual_GLC_branch1(inputs1, inputs2):\n \n x1 = Conv2D(filters=64, kernel_size=(7, 7), strides=(2, 2), padding='same')(inputs1)\n x1 = DeeperAttentionLayer1(units=64, use_scale=True)(x1) ## MFA ####\n x1 = BatchNormalization()(x1)\n x1 = tf.keras.layers.Activation('relu')(x1)\n x1 = MaxPooling2D(pool_size=(3, 3), strides=(2, 2), padding='same')(x1)\n \n x2 = Conv2D(filters=64, kernel_size=(7, 7), strides=(2, 2), padding='same')(inputs2)\n x2 = DeeperAttentionLayer1(units=64, use_scale=True)(x2) ## MFA ####\n x2 = BatchNormalization()(x2)\n x2 = tf.keras.layers.Activation('relu')(x2)\n x2 = MaxPooling2D(pool_size=(3, 3), strides=(2, 2), padding='same')(x2)\n \n\n x1 = RGSA(x1, filters=64)\n x1 = tf.keras.layers.Dropout(0.25)(x1, training = True) ## MCD ####\n x1 = DeeperAttentionLayer1(units=64, use_scale=True)(x1) ## MFA ####\n\n x2 = RGSA(x2, filters=64)\n x2 = tf.keras.layers.Dropout(0.25)(x2, training = True) ## MCD ####\n x2 = DeeperAttentionLayer1(units=64, use_scale=True)(x2)\n \n x1, x2 = DeeperAttentionLayer(units=64, use_scale=True)([x1, x2]) ## MIFA ####\n \n x1 = RGSA(x1, filters=64)\n x1 = tf.keras.layers.Dropout(0.25)(x1, training = True) ## MCD ####\n x1 = DeeperAttentionLayer1(units=64, use_scale=True)(x1) ## MFA ####\n \n x2 = RGSA(x2, filters=64)\n x2 = tf.keras.layers.Dropout(0.25)(x2, training = True) ## MCD ####\n x2 = DeeperAttentionLayer1(units=64, use_scale=True)(x2)\n\n x1, x2 = DeeperAttentionLayer(units=64, use_scale=True)([x1, x2]) ## MIFA ####\n \n x1 = RGSA(x1, filters=128, strides=(2, 2), use_projection=True)\n x1 = tf.keras.layers.Dropout(0.25)(x1, training = True) ## MCD ####\n x1 = DeeperAttentionLayer1(units=128, use_scale=True)(x1) ## MFA ####\n\n x2 = RGSA(x2, filters=128, strides=(2, 2), use_projection=True)\n x2 = tf.keras.layers.Dropout(0.25)(x2, training = True) ## MCD ####\n x2 = DeeperAttentionLayer1(units=128, use_scale=True)(x2)\n\n x1, x2 = DeeperAttentionLayer(units=128, use_scale=True)([x1, x2]) ## MIFA ####\n \n x1 = RGSA(x1, filters=128)\n x1 = tf.keras.layers.Dropout(0.25)(x1, training = True) ## MCD ####\n x1 = DeeperAttentionLayer1(units=128, use_scale=True)(x1)\n \n x2 = RGSA(x2, filters=128)\n x2 = tf.keras.layers.Dropout(0.25)(x2, training = True) ## MCD ####\n x2 = DeeperAttentionLayer1(units=128, use_scale=True)(x2)\n\n x1, x2 = DeeperAttentionLayer(units=128, use_scale=True)([x1, x2]) ## MIFA ####\n \n x1 = RGSA(x1, filters=256, strides=(2, 2), use_projection=True)\n x1 = tf.keras.layers.Dropout(0.25)(x1, training = True) ## MCD ####\n x1 = DeeperAttentionLayer1(units=256, use_scale=True)(x1)\n \n x2 = RGSA(x2, filters=256, strides=(2, 2), use_projection=True)\n x2 = tf.keras.layers.Dropout(0.25)(x2, training = True) ## MCD ####\n x2 = DeeperAttentionLayer1(units=256, use_scale=True)(x2)\n\n x1, x2 = DeeperAttentionLayer(units=256, use_scale=True)([x1, x2]) ## MIFA ####\n \n \n x1 = RGSA(x1, filters=256)\n x1 = tf.keras.layers.Dropout(0.25)(x1, training = True) ## MCD ####\n x1 = DeeperAttentionLayer1(units=256, use_scale=True)(x1)\n \n x2 = RGSA(x2, filters=256)\n x2 = tf.keras.layers.Dropout(0.25)(x2, training = True) ## MCD ####\n x2 = DeeperAttentionLayer1(units=256, use_scale=True)(x2)\n \n x1, x2 = DeeperAttentionLayer(units=256, use_scale=True)([x1, x2]) ## MIFA ####\n\n x1 = RGSA(x1, filters=512, strides=(2, 2), use_projection=True)\n x1 = DeeperAttentionLayer1(units=512, use_scale=True)(x1)\n \n x2 = RGSA(x2, filters=512, strides=(2, 2), use_projection=True)\n x2 = DeeperAttentionLayer1(units=512, use_scale=True)(x2)\n\n x1, x2 = DeeperAttentionLayer(units=512, use_scale=True)([x1, x2]) ## MIFA ####\n \n x1 = RGSA(x1, filters=512)\n x2 = RGSA(x2, filters=512)\n x1, x2 = DeeperAttentionLayer(units=512, use_scale=True)([x1, x2])\n \n return x1, x2","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"#def build_resnet18(input_shape=(128, 128, 3), num_classes=2):\ninput_shape=(128, 128, 3)\ninputs1 = Input(shape=input_shape)\ninputs2 = Input(shape=input_shape)\n\n\n\n#input_data = Input(shape=input_shape, name='input_data')\n# Initial convolutional layer\n\nx1, x2 = residual_GLC_branch1(inputs1, inputs2)\n#print('x:',x.shape)\n\ncon = tf.keras.layers.Concatenate(axis=-1)([x1, x2])\n\ncon = tf.keras.layers.Dropout(0.25)(con, training = True) ## MCD ####\n\nx = GlobalAveragePooling2D()(con)\nprint('GlobalAveragePooling2D x:',x.shape)\n\noutputs1 = Dense(5, activation='softmax')(x)\noutputs2 = Dense(7, activation='softmax')(x)\n\n# Create the model\nmodel = Model([inputs1, inputs2], [outputs1, outputs2])\n#return model\nprint(model.summary())","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"from tensorflow.keras.optimizers import Adam\nfrom tensorflow.keras.optimizers.schedules import ExponentialDecay\n\ninitial_gamma = 0.5\n\noptimizer = Adam(learning_rate=0.001)\n# Compile the model with the custom optimizer\nmodel.compile(optimizer=optimizer,\n loss=['categorical_crossentropy', 'categorical_crossentropy'],\n loss_weights=[initial_gamma, (1 - initial_gamma)],\n metrics=['accuracy', 'accuracy'])\n\n\nfrom tensorflow.keras.callbacks import ModelCheckpoint, EarlyStopping\ndef checkpoint_callback():\n\n checkpoint_filepath = 'best1_model_cer_skin_lung.keras'\n\n model_checkpoint_callback= ModelCheckpoint(filepath=checkpoint_filepath,\n save_weights_only=False,\n #frequency='epoch',\n monitor='val_loss',\n save_best_only=True,\n mode='min',\n verbose=0)\n\n return model_checkpoint_callback\n\ndef early_stopping(patience):\n es_callback = tf.keras.callbacks.EarlyStopping(monitor='val_loss', patience=patience, verbose=1)\n return es_callback\n\n\n\nfrom tensorflow.keras.callbacks import ReduceLROnPlateau\n\nreduce_lr = ReduceLROnPlateau(monitor='val_loss', factor=0.2,\n patience=5, min_lr=0.00001)\n\ncheckpoint_callback = checkpoint_callback()\n\nearly_stopping = early_stopping(patience=100)\ncallbacks = [checkpoint_callback, early_stopping, reduce_lr]\n \n\n# Fit the model with callbacks\nhistory = model.fit([X_train_s, X_train_h], [y_train_s, y_train_h],\n epochs=200,\n validation_split=0.2, verbose=1,\n shuffle=True,\n callbacks=callbacks) # UpdateGammaCallback\n","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"model.evaluate([X_test_s, X_test_h1], [y_test_s, y_test_h1])","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"\nmodel.evaluate([X_test_s1, X_test_h], [y_test_s1, y_test_h])","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"y_pred = model.predict([X_test_s1, X_test_h]) \n\ny_pred_binary1 = y_pred[0] >= 0.5\ny_pred_binary_pgd_test1 = np.array(y_pred_binary1, dtype='int32')\n\nprint('y_pred_binary_pgd_test1:', y_pred_binary_pgd_test1.shape)\n\ny_pred_binary2 = y_pred[1] >= 0.5\ny_pred_binary_pgd_test2 = np.array(y_pred_binary2, dtype='int32')\n\nprint('y_pred_binary_pgd_test2:', y_pred_binary_pgd_test2.shape)\n\n#y_test_s, y_test_h\n# Calculate evaluation metrics for the current epsilon\ny_test_categorical1 = y_test_s1\ny_test_categorical2 = y_test_h\n\n## Task 1:\nprint('skin cancer classification:')\naccuracy = accuracy_score(y_pred_binary_pgd_test1, y_test_categorical1) * 100\nprecision = precision_score(y_pred_binary_pgd_test1, y_test_categorical1, average='macro') * 100\nrecall = recall_score(y_pred_binary_pgd_test1, y_test_categorical1, average='macro') * 100\nf1 = f1_score(y_pred_binary_pgd_test1, y_test_categorical1, average='macro') * 100\n#auc = roc_auc_score(y_pred, y_train_categorical, multi_class='ovr') * 100\nprint('accuracy:', accuracy)\nprint('precision:', precision)\nprint('recall:', recall)\nprint('f1:', f1)\n\n## Task 2:\nprint('Cervical cancer classification:')\naccuracy = accuracy_score(y_pred_binary_pgd_test2, y_test_categorical2) * 100\nprecision = precision_score(y_pred_binary_pgd_test2, y_test_categorical2, average='macro') * 100\nrecall = recall_score(y_pred_binary_pgd_test2, y_test_categorical2, average='macro') * 100\nf1 = f1_score(y_pred_binary_pgd_test2, y_test_categorical2, average='macro') * 100\nprint('accuracy:', accuracy)\nprint('precision:', precision)\nprint('recall:', recall)\nprint('f1:', f1)","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"history = model.fit([X_train_s, X_train_h], [y_train_s, y_train_h],\n epochs=100,\n validation_split=0.2, verbose=1,\n shuffle=True,\n callbacks=callbacks)","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"model.evaluate([X_test_s, X_test_h1], [y_test_s, y_test_h1])","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"from tensorflow.keras.models import load_model\n\nmodel1 = load_model('/kaggle/working/best1_model_cer_skin_lung.keras', custom_objects={'DeeperAttentionLayer1': DeeperAttentionLayer1,\n 'DeeperAttentionLayer': DeeperAttentionLayer\n })\nmodel1.evaluate([X_test_s, X_test_h1], [y_test_s, y_test_h1])","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"model.evaluate([X_test_s1, X_test_h], [y_test_s1, y_test_h])","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"y_pred = model.predict([X_test_s1, X_test_h]) \n\ny_pred_binary1 = y_pred[0] >= 0.5\ny_pred_binary_pgd_test1 = np.array(y_pred_binary1, dtype='int32')\n\nprint('y_pred_binary_pgd_test1:', y_pred_binary_pgd_test1.shape)\n\ny_pred_binary2 = y_pred[1] >= 0.5\ny_pred_binary_pgd_test2 = np.array(y_pred_binary2, dtype='int32')\n\nprint('y_pred_binary_pgd_test2:', y_pred_binary_pgd_test2.shape)\n\n#y_test_s, y_test_h\n# Calculate evaluation metrics for the current epsilon\ny_test_categorical1 = y_test_s1\ny_test_categorical2 = y_test_h\n\n## Task 1:\nprint('skin cancer classification:')\naccuracy = accuracy_score(y_pred_binary_pgd_test1, y_test_categorical1) * 100\nprecision = precision_score(y_pred_binary_pgd_test1, y_test_categorical1, average='macro') * 100\nrecall = recall_score(y_pred_binary_pgd_test1, y_test_categorical1, average='macro') * 100\nf1 = f1_score(y_pred_binary_pgd_test1, y_test_categorical1, average='macro') * 100\n#auc = roc_auc_score(y_pred, y_train_categorical, multi_class='ovr') * 100\nprint('accuracy:', accuracy)\nprint('precision:', precision)\nprint('recall:', recall)\nprint('f1:', f1)\n\n## Task 2:\nprint('Cervical cancer classification:')\naccuracy = accuracy_score(y_pred_binary_pgd_test2, y_test_categorical2) * 100\nprecision = precision_score(y_pred_binary_pgd_test2, y_test_categorical2, average='macro') * 100\nrecall = recall_score(y_pred_binary_pgd_test2, y_test_categorical2, average='macro') * 100\nf1 = f1_score(y_pred_binary_pgd_test2, y_test_categorical2, average='macro') * 100\nprint('accuracy:', accuracy)\nprint('precision:', precision)\nprint('recall:', recall)\nprint('f1:', f1)","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"y_pred = model.predict([X_test_s, X_test_h1]) \n\ny_pred_binary1 = y_pred[0] >= 0.5\ny_pred_binary_pgd_test1 = np.array(y_pred_binary1, dtype='int32')\n\nprint('y_pred_binary_pgd_test1:', y_pred_binary_pgd_test1.shape)\n\ny_pred_binary2 = y_pred[1] >= 0.5\ny_pred_binary_pgd_test2 = np.array(y_pred_binary2, dtype='int32')\n\nprint('y_pred_binary_pgd_test2:', y_pred_binary_pgd_test2.shape)\n\n#y_test_s, y_test_h\n# Calculate evaluation metrics for the current epsilon\ny_test_categorical1 = y_test_s\ny_test_categorical2 = y_test_h1\n\n## Task 1:\nprint('skin cancer classification:')\naccuracy = accuracy_score(y_pred_binary_pgd_test1, y_test_categorical1) * 100\nprecision = precision_score(y_pred_binary_pgd_test1, y_test_categorical1, average='macro') * 100\nrecall = recall_score(y_pred_binary_pgd_test1, y_test_categorical1, average='macro') * 100\nf1 = f1_score(y_pred_binary_pgd_test1, y_test_categorical1, average='macro') * 100\n#auc = roc_auc_score(y_pred, y_train_categorical, multi_class='ovr') * 100\nprint('accuracy:', accuracy)\nprint('precision:', precision)\nprint('recall:', recall)\nprint('f1:', f1)\n\n## Task 2:\nprint('Cervical cancer classification:')\naccuracy = accuracy_score(y_pred_binary_pgd_test2, y_test_categorical2) * 100\nprecision = precision_score(y_pred_binary_pgd_test2, y_test_categorical2, average='macro') * 100\nrecall = recall_score(y_pred_binary_pgd_test2, y_test_categorical2, average='macro') * 100\nf1 = f1_score(y_pred_binary_pgd_test2, y_test_categorical2, average='macro') * 100\nprint('accuracy:', accuracy)\nprint('precision:', precision)\nprint('recall:', recall)\nprint('f1:', f1)","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"model.save('best_model_ever.keras')","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"","metadata":{"trusted":true},"outputs":[],"execution_count":null}]}
--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
1 | # Welcome to My GitHub Profile 👋
2 |
3 | ## Multimodal Fusion Learning with Dual Attention for Medical Imaging
4 |
5 | Multimodal fusion learning has shown significant promise in classifying various diseases such as skin cancer and brain tumors. However, existing methods face three key limitations:
6 |
7 | 1. **Lack of Generalizability**: Existing methods often fail to generalize across diagnosis tasks due to their focus on a specific disease.
8 | 2. **Limited Use of Diverse Modalities**: They do not fully leverage multiple health records from diverse modalities to learn robust complementary information.
9 | 3. **Single Attention Mechanism**: Relying on a single attention mechanism misses the benefits of combining multiple attention strategies within and across various modalities.
10 |
11 | ### Our Proposed Approach: **DRIFA**
12 |
13 | To address these challenges, we propose:
14 | **A Dual Robust Information Fusion Attention Mechanism** (**DRIFA**)
15 |
16 | ### Key Features of DRIFA:
17 |
18 | - **Multi-Branch Fusion Attention Module**: Enhances representations for each modality, such as dermoscopy, pap smear, MRI, and CT scans.
19 | - **Multimodal Information Fusion Attention Module**: Learns refined multimodal shared representations, improving the network's generalization across multiple tasks.
20 |
21 | DRIFA can be integrated with any deep neural network, forming a multimodal fusion learning framework known as **DRIFA-Net**.
22 |
23 | ### Performance Highlights:
24 |
25 | - **Uncertainty Estimation**: Using an ensemble Monte Carlo dropout strategy, DRIFA-Net provides reliable predictions with uncertainty estimates.
26 | - **State-of-the-Art Results**: Extensive experiments on five publicly available datasets demonstrate consistent performance improvements over existing methods.
27 |
28 | ### Technologies and Applications:
29 | - **Applications**: Disease classification (e.g., skin cancer, brain tumors).
30 | - **Modalities**: Dermoscopy, pap smear, MRI, and CT scans.
31 |
32 |
33 | 
34 | Figure 1. Detailed architecture of DRIFA-Net. Key components include: (A) the target-specific multimodal fusion learning (TMFL)
35 | phase, followed by (B) an uncertainty quantification (UQ) phase. TMFL phase comprises a robust residual attention (RRA) block, shown
36 | in (C), and utilizes multi-branch fusion attention (MFA), an additional MFA module for further refinement of local representations, a
37 | multimodal information fusion attention (MIFA) module for improved multimodal representation learning, and multitask learning (MTL)
38 | for handling multiple classification tasks. During (UQ) phase, the reliability of DRIFA-Net predictions are assessed.
39 |
40 |
41 | 
42 |
43 | Figure 2. (a) Multi-branch fusion attention (MFA) module.Key components include hierarchical information fusion attention (HIFA) for diverse
44 | local information enhancement and channelwise local information attention (CLIA) for improved channelspecific representation learning.
45 |
46 |
47 | 
48 |
49 | Figure 3. (a) Multimodal information fusion attention (MIFA) module. This module includes multimodal global information fusion attention (MGIFA) (shown in b) and multimodal local information fusion attention (MLIFA) (shown in c).
50 |
51 |
52 | 
53 |
54 | Figure 4. Visual representation of the important regions highlighted by our proposed DRIFA-Net and four SOTA methods using the
55 | GRAD-CAM technique on two benchmark datasets D1 and D3. (a) and (g) display the original images, while (b) and (h) present results for
56 | Gloria, (c) and (i) for MTF with MA, (d) and (j) for CAF, (e) and (k) for MTTU-Net, and (f) and (l) for our proposed DRIFA-Net.
57 |
58 |
59 | 
60 |
61 | Figure 5. T-SNE visualization of different models applied to the dermoscopy images of the D1 dataset, where (a) represents the T-SNE visualization of Gloria, (b) of MTTU-Net, and (c) of our proposed DRIFA-Net.
62 |
63 |
64 | ### Citation:
65 |
66 | If you find this work useful, please cite:
67 | ```bibtex
68 | @inproceedings{dhar2025multimodal,
69 | title={Multimodal Fusion Learning with Dual Attention for Medical Imaging},
70 | author={Dhar, Joy and Zaidi, N. and Haghighat, M. and Goyal, P. and Roy, S. and Alavi, A. and Kumar, V.},
71 | booktitle={IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
72 | year={2025},
73 | url={https://arxiv.org/abs/2412.01248}
74 | }
75 |
76 |
77 |
78 |
79 |
80 |
81 |
82 |
--------------------------------------------------------------------------------
/d1-dataset-mri-and-d2-dataset-ct-scan.ipynb:
--------------------------------------------------------------------------------
1 | {"metadata":{"kernelspec":{"name":"python3","display_name":"Python 3","language":"python"},"language_info":{"name":"python","version":"3.10.14","mimetype":"text/x-python","codemirror_mode":{"name":"ipython","version":3},"pygments_lexer":"ipython3","nbconvert_exporter":"python","file_extension":".py"},"kaggle":{"accelerator":"gpu","dataSources":[{"sourceId":1183191,"sourceType":"datasetVersion","datasetId":672399},{"sourceId":2645886,"sourceType":"datasetVersion","datasetId":1608934}],"dockerImageVersionId":30787,"isInternetEnabled":true,"language":"python","sourceType":"notebook","isGpuEnabled":true}},"nbformat_minor":4,"nbformat":4,"cells":[{"cell_type":"markdown","source":"# 1. Import needed libraries","metadata":{}},{"cell_type":"code","source":"import os\nfrom PIL import Image\nimport numpy as np\nimport pandas as pd\nimport matplotlib.pyplot as plt\nimport seaborn as sns\nfrom glob import glob\n#---------------------------------------\nfrom sklearn.model_selection import train_test_split\nfrom sklearn.metrics import classification_report, confusion_matrix\n#---------------------------------------\nimport tensorflow as tf\nfrom tensorflow.keras.models import Sequential\nfrom tensorflow.keras.layers import Dense, Dropout, Flatten\nfrom tensorflow.keras.optimizers import Adamax\nfrom tensorflow.keras.metrics import Precision, Recall\nfrom tensorflow.keras.preprocessing.image import ImageDataGenerator\n#---------------------------------------\nimport warnings\nwarnings.filterwarnings(\"ignore\")\n\nimport os\nfrom PIL import Image\nimport numpy as np\nimport pandas as pd\nimport matplotlib.pyplot as plt\nimport seaborn as sns\nfrom glob import glob\n#---------------------------------------\nfrom sklearn.model_selection import train_test_split\nfrom sklearn.metrics import classification_report, confusion_matrix\n#---------------------------------------\nimport tensorflow as tf\nfrom tensorflow.keras.models import Sequential\nfrom tensorflow.keras.layers import Dense, Dropout, Flatten\nfrom tensorflow.keras.optimizers import Adamax\nfrom tensorflow.keras.metrics import Precision, Recall\nfrom tensorflow.keras.preprocessing.image import ImageDataGenerator\n#---------------------------------------\nimport warnings\nwarnings.filterwarnings(\"ignore\")\n\nimg_rows, img_cols = 128, 128\ninput_shape = (img_rows, img_cols, 3)\n\n#n_classes = df['category'].nunique()\nn_classes = 4\nprint('Total number of unique categories:', n_classes)\n\nfrom os import listdir, makedirs\nfrom os.path import isfile, join, basename, splitext, isfile, exists\n\nimport numpy as np\nimport pandas as pd\n\nfrom tqdm import tqdm_notebook\n\nimport tensorflow as tf\nimport keras.backend as K\n\nimport keras\nfrom keras.models import Sequential, Model\nfrom keras.layers import Dropout, Dense, Flatten, BatchNormalization\nfrom keras.layers import DepthwiseConv2D, SeparableConvolution2D, Convolution2D, Conv2D,GRU, LSTM, AlphaDropout, Embedding, ZeroPadding2D,AveragePooling2D, MaxPooling2D, GlobalAveragePooling2D, GlobalMaxPooling2D, Dropout\nfrom keras.layers import Concatenate, Average, Maximum, Bidirectional, TimeDistributed\nfrom keras.callbacks import Callback, EarlyStopping, ModelCheckpoint\n#from keras.engine.input_layer import Input\nfrom keras.models import load_model\n#from keras.initializers import LecunNormal\n\nimport matplotlib.pyplot as plt\nimport seaborn as sns\n\n#pd.set_option('precision', 30)\nnp.set_printoptions(precision = 30)\n\n\n#tf.set_random_seed(1090)\n\nimport pandas as pd\nimport numpy as np\n\nimport seaborn as sns\nimport matplotlib.pyplot as plt\nimport matplotlib.image as img\n\nimport cv2\nimport itertools\nimport pathlib\nimport warnings\nfrom PIL import Image\nfrom random import randint\nwarnings.filterwarnings('ignore')\n\nfrom imblearn.over_sampling import SMOTE\nfrom sklearn.model_selection import train_test_split\nfrom sklearn.metrics import matthews_corrcoef as MCC\nfrom sklearn.metrics import balanced_accuracy_score as BAS\nfrom sklearn.metrics import classification_report, confusion_matrix\n\n\nfrom tensorflow import keras\nfrom keras import layers\nimport tensorflow as tf\n#import tensorflow_addons as tfa\nfrom tensorflow.keras.preprocessing import image_dataset_from_directory\n##from keras.utils.vis_utils import plot_model\nfrom tensorflow.keras import Sequential, Input\nfrom tensorflow.keras.layers import Dense, Dropout\nfrom tensorflow.keras.layers import Conv2D, Flatten\nfrom tensorflow.keras.callbacks import ReduceLROnPlateau\nfrom tensorflow.keras.applications.inception_v3 import InceptionV3\nfrom tensorflow.keras.preprocessing.image import ImageDataGenerator as IDG\nfrom tensorflow.keras.layers import SeparableConv2D, BatchNormalization, GlobalAveragePooling2D\n\nfrom distutils.dir_util import copy_tree, remove_tree\n\nimport os\n#print(os.listdir(\"../input/alzheimer-mri-dataset/Dataset\"))\nimport tensorflow as tf\nfrom keras.datasets import mnist\nimport cv2\nimport os\nimport pathlib\nfrom keras.layers import Conv2D, Conv2DTranspose,Concatenate, Dropout, Dense, Reshape, LayerNormalization, LeakyReLU\nfrom keras import layers, models\nimport matplotlib.pyplot as plt\nimport numpy as np\nfrom sklearn.metrics import accuracy_score, classification_report\nfrom sklearn.metrics import f1_score, recall_score, precision_score\nprint(\"TensorFlow Version:\", tf.__version__)","metadata":{"_cell_guid":"b1076dfc-b9ad-4769-8c92-a6c4dae69d19","_uuid":"8f2839f25d086af736a60e9eeb907d3b93b6e0e5","execution":{"iopub.status.busy":"2024-07-28T19:52:44.874456Z","iopub.execute_input":"2024-07-28T19:52:44.875406Z","iopub.status.idle":"2024-07-28T19:52:56.032164Z","shell.execute_reply.started":"2024-07-28T19:52:44.875365Z","shell.execute_reply":"2024-07-28T19:52:56.031161Z"},"trusted":true},"outputs":[{"name":"stderr","text":"2024-07-28 19:52:48.776203: E external/local_xla/xla/stream_executor/cuda/cuda_dnn.cc:9261] Unable to register cuDNN factory: Attempting to register factory for plugin cuDNN when one has already been registered\n2024-07-28 19:52:48.776341: E external/local_xla/xla/stream_executor/cuda/cuda_fft.cc:607] Unable to register cuFFT factory: Attempting to register factory for plugin cuFFT when one has already been registered\n2024-07-28 19:52:48.909666: E external/local_xla/xla/stream_executor/cuda/cuda_blas.cc:1515] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered\n","output_type":"stream"},{"name":"stdout","text":"Total number of unique categories: 4\nTensorFlow Version: 2.15.0\n","output_type":"stream"}],"execution_count":1},{"cell_type":"code","source":"","metadata":{},"outputs":[],"execution_count":null},{"cell_type":"markdown","source":"# 2. Preprocessing","metadata":{}},{"cell_type":"markdown","source":"## 2.1 Load data","metadata":{}},{"cell_type":"code","source":"def train_df(tr_path):\n classes, class_paths = zip(*[(label, os.path.join(tr_path, label, image))\n for label in os.listdir(tr_path) if os.path.isdir(os.path.join(tr_path, label))\n for image in os.listdir(os.path.join(tr_path, label))])\n\n tr_df = pd.DataFrame({'Class Path': class_paths, 'Class': classes})\n return tr_df","metadata":{"execution":{"iopub.status.busy":"2024-07-28T12:44:24.370880Z","iopub.execute_input":"2024-07-28T12:44:24.371245Z","iopub.status.idle":"2024-07-28T12:44:24.377523Z","shell.execute_reply.started":"2024-07-28T12:44:24.371214Z","shell.execute_reply":"2024-07-28T12:44:24.376355Z"},"trusted":true},"outputs":[],"execution_count":3},{"cell_type":"code","source":"def test_df(ts_path):\n classes, class_paths = zip(*[(label, os.path.join(ts_path, label, image))\n for label in os.listdir(ts_path) if os.path.isdir(os.path.join(ts_path, label))\n for image in os.listdir(os.path.join(ts_path, label))])\n\n ts_df = pd.DataFrame({'Class Path': class_paths, 'Class': classes})\n return ts_df","metadata":{"execution":{"iopub.status.busy":"2024-07-28T12:44:24.718610Z","iopub.execute_input":"2024-07-28T12:44:24.719460Z","iopub.status.idle":"2024-07-28T12:44:24.725054Z","shell.execute_reply.started":"2024-07-28T12:44:24.719421Z","shell.execute_reply":"2024-07-28T12:44:24.724083Z"},"trusted":true},"outputs":[],"execution_count":4},{"cell_type":"code","source":"tr_df = train_df('/kaggle/input/brain-tumor-mri-dataset/Training')","metadata":{"execution":{"iopub.status.busy":"2024-07-28T12:44:24.973845Z","iopub.execute_input":"2024-07-28T12:44:24.974205Z","iopub.status.idle":"2024-07-28T12:44:25.800440Z","shell.execute_reply.started":"2024-07-28T12:44:24.974175Z","shell.execute_reply":"2024-07-28T12:44:25.799605Z"},"trusted":true},"outputs":[],"execution_count":5},{"cell_type":"code","source":"tr_df","metadata":{"execution":{"iopub.status.busy":"2024-07-28T12:44:25.802198Z","iopub.execute_input":"2024-07-28T12:44:25.802878Z","iopub.status.idle":"2024-07-28T12:44:25.823415Z","shell.execute_reply.started":"2024-07-28T12:44:25.802840Z","shell.execute_reply":"2024-07-28T12:44:25.822519Z"},"trusted":true},"outputs":[{"execution_count":6,"output_type":"execute_result","data":{"text/plain":" Class Path Class\n0 /kaggle/input/brain-tumor-mri-dataset/Training... pituitary\n1 /kaggle/input/brain-tumor-mri-dataset/Training... pituitary\n2 /kaggle/input/brain-tumor-mri-dataset/Training... pituitary\n3 /kaggle/input/brain-tumor-mri-dataset/Training... pituitary\n4 /kaggle/input/brain-tumor-mri-dataset/Training... pituitary\n... ... ...\n5707 /kaggle/input/brain-tumor-mri-dataset/Training... glioma\n5708 /kaggle/input/brain-tumor-mri-dataset/Training... glioma\n5709 /kaggle/input/brain-tumor-mri-dataset/Training... glioma\n5710 /kaggle/input/brain-tumor-mri-dataset/Training... glioma\n5711 /kaggle/input/brain-tumor-mri-dataset/Training... glioma\n\n[5712 rows x 2 columns]","text/html":"
\n\n
\n \n \n \n Class Path \n Class \n \n \n \n \n 0 \n /kaggle/input/brain-tumor-mri-dataset/Training... \n pituitary \n \n \n 1 \n /kaggle/input/brain-tumor-mri-dataset/Training... \n pituitary \n \n \n 2 \n /kaggle/input/brain-tumor-mri-dataset/Training... \n pituitary \n \n \n 3 \n /kaggle/input/brain-tumor-mri-dataset/Training... \n pituitary \n \n \n 4 \n /kaggle/input/brain-tumor-mri-dataset/Training... \n pituitary \n \n \n ... \n ... \n ... \n \n \n 5707 \n /kaggle/input/brain-tumor-mri-dataset/Training... \n glioma \n \n \n 5708 \n /kaggle/input/brain-tumor-mri-dataset/Training... \n glioma \n \n \n 5709 \n /kaggle/input/brain-tumor-mri-dataset/Training... \n glioma \n \n \n 5710 \n /kaggle/input/brain-tumor-mri-dataset/Training... \n glioma \n \n \n 5711 \n /kaggle/input/brain-tumor-mri-dataset/Training... \n glioma \n \n \n
\n
5712 rows × 2 columns
\n
"},"metadata":{}}],"execution_count":6},{"cell_type":"code","source":"ts_df = test_df('/kaggle/input/brain-tumor-mri-dataset/Testing')","metadata":{"execution":{"iopub.status.busy":"2024-07-28T12:44:25.824615Z","iopub.execute_input":"2024-07-28T12:44:25.824969Z","iopub.status.idle":"2024-07-28T12:44:26.048128Z","shell.execute_reply.started":"2024-07-28T12:44:25.824936Z","shell.execute_reply":"2024-07-28T12:44:26.047317Z"},"trusted":true},"outputs":[],"execution_count":7},{"cell_type":"code","source":"ts_df","metadata":{"execution":{"iopub.status.busy":"2024-07-28T12:44:26.050134Z","iopub.execute_input":"2024-07-28T12:44:26.050473Z","iopub.status.idle":"2024-07-28T12:44:26.061200Z","shell.execute_reply.started":"2024-07-28T12:44:26.050444Z","shell.execute_reply":"2024-07-28T12:44:26.060152Z"},"trusted":true},"outputs":[{"execution_count":8,"output_type":"execute_result","data":{"text/plain":" Class Path Class\n0 /kaggle/input/brain-tumor-mri-dataset/Testing/... pituitary\n1 /kaggle/input/brain-tumor-mri-dataset/Testing/... pituitary\n2 /kaggle/input/brain-tumor-mri-dataset/Testing/... pituitary\n3 /kaggle/input/brain-tumor-mri-dataset/Testing/... pituitary\n4 /kaggle/input/brain-tumor-mri-dataset/Testing/... pituitary\n... ... ...\n1306 /kaggle/input/brain-tumor-mri-dataset/Testing/... glioma\n1307 /kaggle/input/brain-tumor-mri-dataset/Testing/... glioma\n1308 /kaggle/input/brain-tumor-mri-dataset/Testing/... glioma\n1309 /kaggle/input/brain-tumor-mri-dataset/Testing/... glioma\n1310 /kaggle/input/brain-tumor-mri-dataset/Testing/... glioma\n\n[1311 rows x 2 columns]","text/html":"\n\n
\n \n \n \n Class Path \n Class \n \n \n \n \n 0 \n /kaggle/input/brain-tumor-mri-dataset/Testing/... \n pituitary \n \n \n 1 \n /kaggle/input/brain-tumor-mri-dataset/Testing/... \n pituitary \n \n \n 2 \n /kaggle/input/brain-tumor-mri-dataset/Testing/... \n pituitary \n \n \n 3 \n /kaggle/input/brain-tumor-mri-dataset/Testing/... \n pituitary \n \n \n 4 \n /kaggle/input/brain-tumor-mri-dataset/Testing/... \n pituitary \n \n \n ... \n ... \n ... \n \n \n 1306 \n /kaggle/input/brain-tumor-mri-dataset/Testing/... \n glioma \n \n \n 1307 \n /kaggle/input/brain-tumor-mri-dataset/Testing/... \n glioma \n \n \n 1308 \n /kaggle/input/brain-tumor-mri-dataset/Testing/... \n glioma \n \n \n 1309 \n /kaggle/input/brain-tumor-mri-dataset/Testing/... \n glioma \n \n \n 1310 \n /kaggle/input/brain-tumor-mri-dataset/Testing/... \n glioma \n \n \n
\n
1311 rows × 2 columns
\n
"},"metadata":{}}],"execution_count":8},{"cell_type":"code","source":"# Count of images in each class in train data\nplt.figure(figsize=(15,7))\nax = sns.countplot(data=tr_df , y=tr_df['Class'])\n\nplt.xlabel('')\nplt.ylabel('')\nplt.title('Count of images in each class', fontsize=20)\nax.bar_label(ax.containers[0])\nplt.show()","metadata":{"execution":{"iopub.status.busy":"2024-07-28T12:44:26.062338Z","iopub.execute_input":"2024-07-28T12:44:26.062615Z","iopub.status.idle":"2024-07-28T12:44:26.386783Z","shell.execute_reply.started":"2024-07-28T12:44:26.062592Z","shell.execute_reply":"2024-07-28T12:44:26.385815Z"},"trusted":true},"outputs":[{"output_type":"display_data","data":{"text/plain":"","image/png":""},"metadata":{}}],"execution_count":9},{"cell_type":"code","source":"#Count each class in test data\nplt.figure(figsize=(15, 7))\nax = sns.countplot(y=ts_df['Class'], palette='viridis')\n\nax.set(xlabel='', ylabel='', title='Count of images in each class')\nax.bar_label(ax.containers[0])\n\nplt.show()","metadata":{"execution":{"iopub.status.busy":"2024-07-28T12:44:26.388404Z","iopub.execute_input":"2024-07-28T12:44:26.388715Z","iopub.status.idle":"2024-07-28T12:44:26.662331Z","shell.execute_reply.started":"2024-07-28T12:44:26.388689Z","shell.execute_reply":"2024-07-28T12:44:26.661435Z"},"trusted":true},"outputs":[{"output_type":"display_data","data":{"text/plain":"","image/png":""},"metadata":{}}],"execution_count":10},{"cell_type":"markdown","source":"## 2.2 Split data into train, test, valid","metadata":{}},{"cell_type":"code","source":"valid_df, ts_df = train_test_split(ts_df, train_size=0.5, random_state=20, stratify=ts_df['Class'])","metadata":{"execution":{"iopub.status.busy":"2024-07-28T12:44:26.664286Z","iopub.execute_input":"2024-07-28T12:44:26.664748Z","iopub.status.idle":"2024-07-28T12:44:26.675186Z","shell.execute_reply.started":"2024-07-28T12:44:26.664714Z","shell.execute_reply":"2024-07-28T12:44:26.674321Z"},"trusted":true},"outputs":[],"execution_count":11},{"cell_type":"code","source":"valid_df","metadata":{"execution":{"iopub.status.busy":"2024-07-28T12:44:26.687435Z","iopub.execute_input":"2024-07-28T12:44:26.687712Z","iopub.status.idle":"2024-07-28T12:44:26.697848Z","shell.execute_reply.started":"2024-07-28T12:44:26.687689Z","shell.execute_reply":"2024-07-28T12:44:26.696861Z"},"trusted":true},"outputs":[{"execution_count":12,"output_type":"execute_result","data":{"text/plain":" Class Path Class\n1297 /kaggle/input/brain-tumor-mri-dataset/Testing/... glioma\n723 /kaggle/input/brain-tumor-mri-dataset/Testing/... meningioma\n61 /kaggle/input/brain-tumor-mri-dataset/Testing/... pituitary\n778 /kaggle/input/brain-tumor-mri-dataset/Testing/... meningioma\n1120 /kaggle/input/brain-tumor-mri-dataset/Testing/... glioma\n... ... ...\n1070 /kaggle/input/brain-tumor-mri-dataset/Testing/... glioma\n554 /kaggle/input/brain-tumor-mri-dataset/Testing/... notumor\n1284 /kaggle/input/brain-tumor-mri-dataset/Testing/... glioma\n899 /kaggle/input/brain-tumor-mri-dataset/Testing/... meningioma\n626 /kaggle/input/brain-tumor-mri-dataset/Testing/... notumor\n\n[655 rows x 2 columns]","text/html":"\n\n
\n \n \n \n Class Path \n Class \n \n \n \n \n 1297 \n /kaggle/input/brain-tumor-mri-dataset/Testing/... \n glioma \n \n \n 723 \n /kaggle/input/brain-tumor-mri-dataset/Testing/... \n meningioma \n \n \n 61 \n /kaggle/input/brain-tumor-mri-dataset/Testing/... \n pituitary \n \n \n 778 \n /kaggle/input/brain-tumor-mri-dataset/Testing/... \n meningioma \n \n \n 1120 \n /kaggle/input/brain-tumor-mri-dataset/Testing/... \n glioma \n \n \n ... \n ... \n ... \n \n \n 1070 \n /kaggle/input/brain-tumor-mri-dataset/Testing/... \n glioma \n \n \n 554 \n /kaggle/input/brain-tumor-mri-dataset/Testing/... \n notumor \n \n \n 1284 \n /kaggle/input/brain-tumor-mri-dataset/Testing/... \n glioma \n \n \n 899 \n /kaggle/input/brain-tumor-mri-dataset/Testing/... \n meningioma \n \n \n 626 \n /kaggle/input/brain-tumor-mri-dataset/Testing/... \n notumor \n \n \n
\n
655 rows × 2 columns
\n
"},"metadata":{}}],"execution_count":12},{"cell_type":"markdown","source":"## 2.3 Data preprocessing","metadata":{}},{"cell_type":"code","source":"batch_size = 32\nimg_size = (128, 128)\n\n_gen = ImageDataGenerator(rescale=1/255,\n brightness_range=(0.8, 1.2))\n\nts_gen = ImageDataGenerator(rescale=1/255)\n\n\ntr_gen = _gen.flow_from_dataframe(tr_df, x_col='Class Path',\n y_col='Class', batch_size=5712,\n target_size=img_size)\n\nvalid_gen = _gen.flow_from_dataframe(valid_df, x_col='Class Path',\n y_col='Class', batch_size=655,\n target_size=img_size)\n\nts_gen = ts_gen.flow_from_dataframe(ts_df, x_col='Class Path',\n y_col='Class', batch_size=656,\n target_size=img_size, shuffle=False)","metadata":{"execution":{"iopub.status.busy":"2024-07-28T12:44:27.150148Z","iopub.execute_input":"2024-07-28T12:44:27.150994Z","iopub.status.idle":"2024-07-28T12:44:31.743371Z","shell.execute_reply.started":"2024-07-28T12:44:27.150964Z","shell.execute_reply":"2024-07-28T12:44:31.742454Z"},"trusted":true},"outputs":[{"name":"stdout","text":"Found 5712 validated image filenames belonging to 4 classes.\nFound 655 validated image filenames belonging to 4 classes.\nFound 656 validated image filenames belonging to 4 classes.\n","output_type":"stream"}],"execution_count":13},{"cell_type":"markdown","source":"## 2.4 Getting samples from data","metadata":{}},{"cell_type":"code","source":"X_train, y_train = next(tr_gen)\nX_train.shape, y_train.shape","metadata":{"execution":{"iopub.status.busy":"2024-07-28T12:44:31.745113Z","iopub.execute_input":"2024-07-28T12:44:31.745810Z","iopub.status.idle":"2024-07-28T12:45:01.160185Z","shell.execute_reply.started":"2024-07-28T12:44:31.745773Z","shell.execute_reply":"2024-07-28T12:45:01.159309Z"},"trusted":true},"outputs":[{"execution_count":14,"output_type":"execute_result","data":{"text/plain":"((5712, 128, 128, 3), (5712, 4))"},"metadata":{}}],"execution_count":14},{"cell_type":"code","source":"class ReadDataset:\n def __init__(self, datasetpath, labels, image_shape):\n self.datasetpath = datasetpath\n self.labels = labels\n self.image_shape = image_shape\n def returListImages(self,):\n self.images = []\n for label in self.labels:\n self.images.append(list(pathlib.Path(os.path.join(self.datasetpath,\n label)).glob('*.*')))\n def readImages(self,):\n self.returListImages()\n self.finalImages = []\n labels = []\n for label in range(len(self.labels)):\n for img in self.images[label]:\n img = cv2.imread(str(img))\n img = cv2.resize(img , self.image_shape)\n img = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)\n img = img/255\n self.finalImages.append(img)\n labels.append(label)\n images = np.array(self.finalImages)\n labels = np.array(labels)\n return images, labels\nimport os\nimport pathlib\nreadDatasetObject = ReadDataset('/kaggle/input/the-iqothnccd-lung-cancer-dataset/The IQ-OTHNCCD lung cancer dataset',\n ['Bengin cases', 'Malignant cases', 'Normal cases'],\n (128,128))\nimages_train_covid_cxr, labels_train_covid_cxr = readDatasetObject.readImages()\nprint(images_train_covid_cxr.shape, labels_train_covid_cxr.shape)\n\nfrom sklearn.model_selection import train_test_split\n\nX_train_covid_cxr, X_test_covid_cxr, y_train_covid_cxr, y_test_covid_cxr = train_test_split(\n images_train_covid_cxr, labels_train_covid_cxr, test_size=0.3, random_state=42)\n\nprint(X_train_covid_cxr.shape, X_test_covid_cxr.shape, y_train_covid_cxr.shape, y_test_covid_cxr.shape)\n\nfrom sklearn.model_selection import train_test_split\n\nX_test_covid_cxr, X_val_covid_cxr, y_test_covid_cxr, y_val_covid_cxr = train_test_split(\n X_test_covid_cxr, y_test_covid_cxr, test_size=0.5, random_state=42)\n\nX_test_covid_cxr.shape, X_val_covid_cxr.shape, y_test_covid_cxr.shape, y_val_covid_cxr.shape","metadata":{"execution":{"iopub.status.busy":"2024-07-28T12:45:01.161627Z","iopub.execute_input":"2024-07-28T12:45:01.161922Z","iopub.status.idle":"2024-07-28T12:45:14.557137Z","shell.execute_reply.started":"2024-07-28T12:45:01.161897Z","shell.execute_reply":"2024-07-28T12:45:14.556237Z"},"trusted":true},"outputs":[{"name":"stdout","text":"(1097, 128, 128, 3) (1097,)\n(767, 128, 128, 3) (330, 128, 128, 3) (767,) (330,)\n","output_type":"stream"},{"execution_count":15,"output_type":"execute_result","data":{"text/plain":"((165, 128, 128, 3), (165, 128, 128, 3), (165,), (165,))"},"metadata":{}}],"execution_count":15},{"cell_type":"code","source":"","metadata":{},"outputs":[],"execution_count":null},{"cell_type":"code","source":"'''y_train_class_indices = y_train_covid_cxr\n\n# Map class indices\ny_train_mapped_indices = y_train_class_indices + 4\n\n# Convert back to one-hot encoding for training (if needed)\ny_train_mapped_one_hot = tf.keras.utils.to_categorical(y_train_mapped_indices)\n\n# Print the first 10 one-hot encoded labels to verify\nprint(\"One-hot encoded mapped labels (first 10):\", y_train_mapped_one_hot.shape)\ny_train_mapped_indices = np.array(y_train_mapped_indices)\ny_train_mapped_series = pd.Series(y_train_mapped_indices)\n\n# Use value_counts to count unique values\nvalue_counts = y_train_mapped_series.value_counts()\n\n# Print the value counts\nprint(value_counts)\n\ny_train1 = np.argmax(y_train, axis=1)\nprint(y_train1.shape)\n\nconcatenated_labels = np.concatenate((y_train1, y_train_mapped_indices))\nprint(concatenated_labels.shape)\n\nconcatenated_images = np.concatenate((X_train, X_train_covid_cxr))\nconcatenated_images.shape'''","metadata":{"execution":{"iopub.status.busy":"2024-12-01T13:59:56.653026Z","iopub.execute_input":"2024-12-01T13:59:56.653538Z","iopub.status.idle":"2024-12-01T13:59:56.663263Z","shell.execute_reply.started":"2024-12-01T13:59:56.653493Z","shell.execute_reply":"2024-12-01T13:59:56.662570Z"},"trusted":true},"outputs":[{"execution_count":1,"output_type":"execute_result","data":{"text/plain":"'y_train_class_indices = y_train_covid_cxr\\n\\n# Map class indices\\ny_train_mapped_indices = y_train_class_indices + 4\\n\\n# Convert back to one-hot encoding for training (if needed)\\ny_train_mapped_one_hot = tf.keras.utils.to_categorical(y_train_mapped_indices)\\n\\n# Print the first 10 one-hot encoded labels to verify\\nprint(\"One-hot encoded mapped labels (first 10):\", y_train_mapped_one_hot.shape)\\ny_train_mapped_indices = np.array(y_train_mapped_indices)\\ny_train_mapped_series = pd.Series(y_train_mapped_indices)\\n\\n# Use value_counts to count unique values\\nvalue_counts = y_train_mapped_series.value_counts()\\n\\n# Print the value counts\\nprint(value_counts)\\n\\ny_train1 = np.argmax(y_train, axis=1)\\nprint(y_train1.shape)\\n\\nconcatenated_labels = np.concatenate((y_train1, y_train_mapped_indices))\\nprint(concatenated_labels.shape)\\n\\nconcatenated_images = np.concatenate((X_train, X_train_covid_cxr))\\nconcatenated_images.shape'"},"metadata":{}}],"execution_count":1},{"cell_type":"code","source":"'''random_indices = np.random.choice(6479, 6478, replace=False)\nconcatenated_images = concatenated_images[random_indices]\nconcatenated_labels = concatenated_labels[random_indices]\nconcatenated_images.shape, concatenated_labels.shape'''","metadata":{"execution":{"iopub.status.busy":"2024-07-28T12:45:15.273605Z","iopub.execute_input":"2024-07-28T12:45:15.273975Z","iopub.status.idle":"2024-07-28T12:45:16.025240Z","shell.execute_reply.started":"2024-07-28T12:45:15.273943Z","shell.execute_reply":"2024-07-28T12:45:16.024292Z"},"trusted":true},"outputs":[{"execution_count":17,"output_type":"execute_result","data":{"text/plain":"((6478, 128, 128, 3), (6478,))"},"metadata":{}}],"execution_count":17},{"cell_type":"code","source":"'''import numpy as np\nimport cv2\n\ndef rotate_image(image, angle):\n \"\"\"\n Rotate the image by the specified angle.\n \"\"\"\n center = tuple(np.array(image.shape[1::-1]) / 2)\n rotation_matrix = cv2.getRotationMatrix2D(center, angle, 1.0)\n rotated_image = cv2.warpAffine(image, rotation_matrix, image.shape[1::-1], flags=cv2.INTER_LINEAR)\n return rotated_image\n\ndef translate_image(image, tx, ty):\n \"\"\"\n Translate the image by the specified translation parameters.\n \"\"\"\n translation_matrix = np.float32([[1, 0, tx], [0, 1, ty]])\n translated_image = cv2.warpAffine(image, translation_matrix, image.shape[1::-1])\n return translated_image\n\n# Example data\n#X_train = np.random.rand(100, 28, 28) # Assuming 100 images of size 28x28\n#y_train = np.random.randint(0, 10, 100) # Assuming 100 labels\n\n# Augmentation parameters\nrotation_angles = [5]\ntranslations = [(5, 5)]\n\naugmented_X_train = []\naugmented_y_train = []\n\nfor image, label in zip(X_train, y_train):\n # Original image\n augmented_X_train.append(image)\n augmented_y_train.append(label)\n\n # Augment with rotations\n for angle in rotation_angles:\n rotated_image = rotate_image(image, angle)\n augmented_X_train.append(rotated_image)\n augmented_y_train.append(label)\n\n # Augment with translations\n for tx, ty in translations:\n translated_image = translate_image(image, tx, ty)\n augmented_X_train.append(translated_image)\n augmented_y_train.append(label)\n\n# Convert lists to numpy arrays\naugmented_X_train = np.array(augmented_X_train)\naugmented_y_train = np.array(augmented_y_train)\n\n# Shuffle the data\nshuffle_indices = np.random.permutation(len(augmented_X_train))\naugmented_X_train = augmented_X_train[shuffle_indices]\naugmented_y_train = augmented_y_train[shuffle_indices]\naugmented_X_train.shape, augmented_y_train.shape\n# Now, augmented_X_train and augmented_y_train contain the augmented dataset.'''","metadata":{"execution":{"iopub.status.busy":"2024-07-28T12:45:16.026248Z","iopub.execute_input":"2024-07-28T12:45:16.026553Z","iopub.status.idle":"2024-07-28T12:45:16.034622Z","shell.execute_reply.started":"2024-07-28T12:45:16.026528Z","shell.execute_reply":"2024-07-28T12:45:16.033754Z"},"trusted":true},"outputs":[{"execution_count":18,"output_type":"execute_result","data":{"text/plain":"'import numpy as np\\nimport cv2\\n\\ndef rotate_image(image, angle):\\n \"\"\"\\n Rotate the image by the specified angle.\\n \"\"\"\\n center = tuple(np.array(image.shape[1::-1]) / 2)\\n rotation_matrix = cv2.getRotationMatrix2D(center, angle, 1.0)\\n rotated_image = cv2.warpAffine(image, rotation_matrix, image.shape[1::-1], flags=cv2.INTER_LINEAR)\\n return rotated_image\\n\\ndef translate_image(image, tx, ty):\\n \"\"\"\\n Translate the image by the specified translation parameters.\\n \"\"\"\\n translation_matrix = np.float32([[1, 0, tx], [0, 1, ty]])\\n translated_image = cv2.warpAffine(image, translation_matrix, image.shape[1::-1])\\n return translated_image\\n\\n# Example data\\n#X_train = np.random.rand(100, 28, 28) # Assuming 100 images of size 28x28\\n#y_train = np.random.randint(0, 10, 100) # Assuming 100 labels\\n\\n# Augmentation parameters\\nrotation_angles = [5]\\ntranslations = [(5, 5)]\\n\\naugmented_X_train = []\\naugmented_y_train = []\\n\\nfor image, label in zip(X_train, y_train):\\n # Original image\\n augmented_X_train.append(image)\\n augmented_y_train.append(label)\\n\\n # Augment with rotations\\n for angle in rotation_angles:\\n rotated_image = rotate_image(image, angle)\\n augmented_X_train.append(rotated_image)\\n augmented_y_train.append(label)\\n\\n # Augment with translations\\n for tx, ty in translations:\\n translated_image = translate_image(image, tx, ty)\\n augmented_X_train.append(translated_image)\\n augmented_y_train.append(label)\\n\\n# Convert lists to numpy arrays\\naugmented_X_train = np.array(augmented_X_train)\\naugmented_y_train = np.array(augmented_y_train)\\n\\n# Shuffle the data\\nshuffle_indices = np.random.permutation(len(augmented_X_train))\\naugmented_X_train = augmented_X_train[shuffle_indices]\\naugmented_y_train = augmented_y_train[shuffle_indices]\\naugmented_X_train.shape, augmented_y_train.shape\\n# Now, augmented_X_train and augmented_y_train contain the augmented dataset.'"},"metadata":{}}],"execution_count":18},{"cell_type":"code","source":"random_indices = np.random.choice(5712, 766, replace=False)\naugmented_X_train = X_train[random_indices]\naugmented_y_train = y_train[random_indices]\naugmented_X_train.shape, augmented_y_train.shape","metadata":{"execution":{"iopub.status.busy":"2024-07-28T12:45:16.035757Z","iopub.execute_input":"2024-07-28T12:45:16.036054Z","iopub.status.idle":"2024-07-28T12:45:16.094678Z","shell.execute_reply.started":"2024-07-28T12:45:16.036031Z","shell.execute_reply":"2024-07-28T12:45:16.093736Z"},"trusted":true},"outputs":[{"execution_count":19,"output_type":"execute_result","data":{"text/plain":"((766, 128, 128, 3), (766, 4))"},"metadata":{}}],"execution_count":19},{"cell_type":"code","source":"#X_train_covid_cxr.shape, X_test_covid_cxr.shape, y_train_covid_cxr.shape, y_test_covid_cxr.shape\n\ny_train = np.concatenate((y_train,augmented_y_train), axis=0)\nX_train = np.concatenate((X_train, augmented_X_train), axis=0)\nX_train.shape, y_train.shape","metadata":{"execution":{"iopub.status.busy":"2024-07-28T12:45:16.096011Z","iopub.execute_input":"2024-07-28T12:45:16.096659Z","iopub.status.idle":"2024-07-28T12:45:16.614766Z","shell.execute_reply.started":"2024-07-28T12:45:16.096622Z","shell.execute_reply":"2024-07-28T12:45:16.613870Z"},"trusted":true},"outputs":[{"execution_count":20,"output_type":"execute_result","data":{"text/plain":"((6478, 128, 128, 3), (6478, 4))"},"metadata":{}}],"execution_count":20},{"cell_type":"code","source":"import numpy as np\nimport cv2\n\ndef rotate_image(image, angle):\n \"\"\"\n Rotate the image by the specified angle.\n \"\"\"\n center = tuple(np.array(image.shape[1::-1]) / 2)\n rotation_matrix = cv2.getRotationMatrix2D(center, angle, 1.0)\n rotated_image = cv2.warpAffine(image, rotation_matrix, image.shape[1::-1], flags=cv2.INTER_LINEAR)\n return rotated_image\n\ndef translate_image(image, tx, ty):\n \"\"\"\n Translate the image by the specified translation parameters.\n \"\"\"\n translation_matrix = np.float32([[1, 0, tx], [0, 1, ty]])\n translated_image = cv2.warpAffine(image, translation_matrix, image.shape[1::-1])\n return translated_image\n\n# Example data\n#X_train = np.random.rand(100, 28, 28) # Assuming 100 images of size 28x28\n#y_train = np.random.randint(0, 10, 100) # Assuming 100 labels\n\n# Augmentation parameters\nrotation_angles = [5]\ntranslations = [(5, 5)]\n\naugmented_X_train = []\naugmented_y_train = []\n\nfor image, label in zip(X_train_covid_cxr, y_train_covid_cxr):\n # Original image\n augmented_X_train.append(image)\n augmented_y_train.append(label)\n\n # Augment with rotations\n for angle in rotation_angles:\n rotated_image = rotate_image(image, angle)\n augmented_X_train.append(rotated_image)\n augmented_y_train.append(label)\n\n # Augment with translations\n for tx, ty in translations:\n translated_image = translate_image(image, tx, ty)\n augmented_X_train.append(translated_image)\n augmented_y_train.append(label)\n\n# Convert lists to numpy arrays\naugmented_X_train = np.array(augmented_X_train)\naugmented_y_train = np.array(augmented_y_train)\n\n# Shuffle the data\nshuffle_indices = np.random.permutation(len(augmented_X_train))\naugmented_X_train = augmented_X_train[shuffle_indices]\naugmented_y_train = augmented_y_train[shuffle_indices]\naugmented_X_train.shape, augmented_y_train.shape\n# Now, augmented_X_train and augmented_y_train contain the augmented dataset.","metadata":{"execution":{"iopub.status.busy":"2024-07-28T12:45:16.616058Z","iopub.execute_input":"2024-07-28T12:45:16.616438Z","iopub.status.idle":"2024-07-28T12:45:17.888485Z","shell.execute_reply.started":"2024-07-28T12:45:16.616404Z","shell.execute_reply":"2024-07-28T12:45:17.887493Z"},"trusted":true},"outputs":[{"execution_count":21,"output_type":"execute_result","data":{"text/plain":"((2301, 128, 128, 3), (2301,))"},"metadata":{}}],"execution_count":21},{"cell_type":"code","source":"#X_train_covid_cxr.shape, X_test_covid_cxr.shape, y_train_covid_cxr.shape, y_test_covid_cxr.shape\n\nlabels_train_covid_cxr = np.concatenate((augmented_y_train,augmented_y_train, augmented_y_train), axis=0)\nimages_train_covid_cxr = np.concatenate((augmented_X_train, augmented_X_train, augmented_X_train), axis=0)\nimages_train_covid_cxr.shape, labels_train_covid_cxr.shape\n\n","metadata":{"execution":{"iopub.status.busy":"2024-07-28T12:45:17.892639Z","iopub.execute_input":"2024-07-28T12:45:17.892948Z","iopub.status.idle":"2024-07-28T12:45:18.870631Z","shell.execute_reply.started":"2024-07-28T12:45:17.892921Z","shell.execute_reply":"2024-07-28T12:45:18.869600Z"},"trusted":true},"outputs":[{"execution_count":22,"output_type":"execute_result","data":{"text/plain":"((6903, 128, 128, 3), (6903,))"},"metadata":{}}],"execution_count":22},{"cell_type":"code","source":"random_indices = np.random.choice(6903, 6478, replace=False)\nimages_train_covid_cxr = images_train_covid_cxr[random_indices]\nlabels_train_covid_cxr = labels_train_covid_cxr[random_indices]\nimages_train_covid_cxr.shape, labels_train_covid_cxr.shape","metadata":{"execution":{"iopub.status.busy":"2024-07-28T12:45:18.871833Z","iopub.execute_input":"2024-07-28T12:45:18.872130Z","iopub.status.idle":"2024-07-28T12:45:19.616245Z","shell.execute_reply.started":"2024-07-28T12:45:18.872105Z","shell.execute_reply":"2024-07-28T12:45:19.615456Z"},"trusted":true},"outputs":[{"execution_count":23,"output_type":"execute_result","data":{"text/plain":"((6478, 128, 128, 3), (6478,))"},"metadata":{}}],"execution_count":23},{"cell_type":"code","source":"X_val, y_val = next(valid_gen)\nX_val.shape, y_val.shape","metadata":{"execution":{"iopub.status.busy":"2024-07-28T12:45:19.617579Z","iopub.execute_input":"2024-07-28T12:45:19.617952Z","iopub.status.idle":"2024-07-28T12:45:22.853226Z","shell.execute_reply.started":"2024-07-28T12:45:19.617918Z","shell.execute_reply":"2024-07-28T12:45:22.852312Z"},"trusted":true},"outputs":[{"execution_count":24,"output_type":"execute_result","data":{"text/plain":"((655, 128, 128, 3), (655, 4))"},"metadata":{}}],"execution_count":24},{"cell_type":"code","source":"","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"random_indices = np.random.choice(820, 800, replace=False)\nconcatenated_val_images1 = concatenated_val_images[random_indices]\nconcatenated_val_labels1 = concatenated_val_labels[random_indices]\nconcatenated_val_images1.shape, concatenated_val_labels1.shape","metadata":{"execution":{"iopub.status.busy":"2024-07-28T12:45:22.917173Z","iopub.execute_input":"2024-07-28T12:45:22.917550Z","iopub.status.idle":"2024-07-28T12:45:23.014879Z","shell.execute_reply.started":"2024-07-28T12:45:22.917524Z","shell.execute_reply":"2024-07-28T12:45:23.013962Z"},"trusted":true},"outputs":[{"execution_count":26,"output_type":"execute_result","data":{"text/plain":"((800, 128, 128, 3), (800, 7))"},"metadata":{}}],"execution_count":26},{"cell_type":"code","source":"#X_train_covid_cxr.shape, X_test_covid_cxr.shape, y_train_covid_cxr.shape, y_test_covid_cxr.shape\n\nconcatenated_val_labels = np.concatenate((concatenated_val_labels, concatenated_val_labels1), axis=0)\nconcatenated_val_images = np.concatenate((concatenated_val_images, concatenated_val_images1), axis=0)\nconcatenated_val_images.shape, concatenated_val_labels.shape","metadata":{"execution":{"iopub.status.busy":"2024-07-28T12:45:23.016111Z","iopub.execute_input":"2024-07-28T12:45:23.016496Z","iopub.status.idle":"2024-07-28T12:45:23.262223Z","shell.execute_reply.started":"2024-07-28T12:45:23.016463Z","shell.execute_reply":"2024-07-28T12:45:23.261337Z"},"trusted":true},"outputs":[{"execution_count":27,"output_type":"execute_result","data":{"text/plain":"((1620, 128, 128, 3), (1620, 7))"},"metadata":{}}],"execution_count":27},{"cell_type":"code","source":"#X_train_covid_cxr.shape, X_test_covid_cxr.shape, y_train_covid_cxr.shape, y_test_covid_cxr.shape\n\nX_val = np.concatenate((X_val, X_val, X_val), axis=0)\ny_val = np.concatenate((y_val, y_val, y_val), axis=0)\nX_val.shape, y_val.shape","metadata":{"execution":{"iopub.status.busy":"2024-07-28T12:45:23.263535Z","iopub.execute_input":"2024-07-28T12:45:23.263835Z","iopub.status.idle":"2024-07-28T12:45:23.352803Z","shell.execute_reply.started":"2024-07-28T12:45:23.263811Z","shell.execute_reply":"2024-07-28T12:45:23.351862Z"},"trusted":true},"outputs":[{"execution_count":28,"output_type":"execute_result","data":{"text/plain":"((1965, 128, 128, 3), (1965, 4))"},"metadata":{}}],"execution_count":28},{"cell_type":"code","source":"random_indices = np.random.choice(1965, 1620, replace=False)\nX_val = X_val[random_indices]\ny_val = y_val[random_indices]\nX_val.shape, y_val.shape","metadata":{"execution":{"iopub.status.busy":"2024-07-28T12:45:23.353895Z","iopub.execute_input":"2024-07-28T12:45:23.354193Z","iopub.status.idle":"2024-07-28T12:45:23.453976Z","shell.execute_reply.started":"2024-07-28T12:45:23.354169Z","shell.execute_reply":"2024-07-28T12:45:23.453057Z"},"trusted":true},"outputs":[{"execution_count":29,"output_type":"execute_result","data":{"text/plain":"((1620, 128, 128, 3), (1620, 4))"},"metadata":{}}],"execution_count":29},{"cell_type":"code","source":"#X_val_covid_cxr\n\n#X_train_covid_cxr.shape, X_test_covid_cxr.shape, y_train_covid_cxr.shape, y_test_covid_cxr.shape\n\nX_val_covid_cxr = np.concatenate((X_val_covid_cxr, X_val_covid_cxr, X_val_covid_cxr, X_val_covid_cxr, X_val_covid_cxr), axis=0)\ny_val_covid_cxr = np.concatenate((y_val_covid_cxr, y_val_covid_cxr, y_val_covid_cxr, y_val_covid_cxr, y_val_covid_cxr), axis=0)\nX_val_covid_cxr.shape, y_val_covid_cxr.shape","metadata":{"execution":{"iopub.status.busy":"2024-07-28T12:45:23.455229Z","iopub.execute_input":"2024-07-28T12:45:23.455947Z","iopub.status.idle":"2024-07-28T12:45:23.529774Z","shell.execute_reply.started":"2024-07-28T12:45:23.455911Z","shell.execute_reply":"2024-07-28T12:45:23.528862Z"},"trusted":true},"outputs":[{"execution_count":30,"output_type":"execute_result","data":{"text/plain":"((825, 128, 128, 3), (825,))"},"metadata":{}}],"execution_count":30},{"cell_type":"code","source":"#X_val_covid_cxr\n\n#X_train_covid_cxr.shape, X_test_covid_cxr.shape, y_train_covid_cxr.shape, y_test_covid_cxr.shape\n\nX_val_covid_cxr = np.concatenate((X_val_covid_cxr, X_val_covid_cxr), axis=0)\ny_val_covid_cxr = np.concatenate((y_val_covid_cxr, y_val_covid_cxr), axis=0)\nX_val_covid_cxr.shape, y_val_covid_cxr.shape","metadata":{"execution":{"iopub.status.busy":"2024-07-28T12:45:23.531096Z","iopub.execute_input":"2024-07-28T12:45:23.531745Z","iopub.status.idle":"2024-07-28T12:45:23.789693Z","shell.execute_reply.started":"2024-07-28T12:45:23.531709Z","shell.execute_reply":"2024-07-28T12:45:23.788678Z"},"trusted":true},"outputs":[{"execution_count":31,"output_type":"execute_result","data":{"text/plain":"((1650, 128, 128, 3), (1650,))"},"metadata":{}}],"execution_count":31},{"cell_type":"code","source":"random_indices = np.random.choice(1650, 1620, replace=False)\nX_val_covid_cxr = X_val_covid_cxr[random_indices]\ny_val_covid_cxr = y_val_covid_cxr[random_indices]\nX_val_covid_cxr.shape, y_val_covid_cxr.shape","metadata":{"execution":{"iopub.status.busy":"2024-07-28T12:45:23.790715Z","iopub.execute_input":"2024-07-28T12:45:23.790975Z","iopub.status.idle":"2024-07-28T12:45:23.981638Z","shell.execute_reply.started":"2024-07-28T12:45:23.790954Z","shell.execute_reply":"2024-07-28T12:45:23.980697Z"},"trusted":true},"outputs":[{"execution_count":32,"output_type":"execute_result","data":{"text/plain":"((1620, 128, 128, 3), (1620,))"},"metadata":{}}],"execution_count":32},{"cell_type":"code","source":"","metadata":{},"outputs":[],"execution_count":null}]}
--------------------------------------------------------------------------------
/drifa-net.ipynb:
--------------------------------------------------------------------------------
1 | {"metadata":{"kernelspec":{"language":"python","display_name":"Python 3","name":"python3"},"language_info":{"name":"python","version":"3.10.14","mimetype":"text/x-python","codemirror_mode":{"name":"ipython","version":3},"pygments_lexer":"ipython3","nbconvert_exporter":"python","file_extension":".py"},"kaggle":{"accelerator":"gpu","dataSources":[],"dockerImageVersionId":30787,"isInternetEnabled":true,"language":"python","sourceType":"notebook","isGpuEnabled":true}},"nbformat_minor":4,"nbformat":4,"cells":[{"cell_type":"code","source":"import cv2\nimport seaborn as sns\nimport matplotlib.pyplot as plt\nimport numpy as np\nimport pandas as pd\nimport plotly.express as px\nsns.set_style('whitegrid')\nfrom sklearn.metrics import confusion_matrix , classification_report\nimport tensorflow as tf\nfrom tensorflow import keras\nfrom tensorflow.keras.models import Sequential\nfrom tensorflow.keras.layers import Dense , Flatten , Conv2D , MaxPooling2D , Dropout , Activation , BatchNormalization\nfrom tensorflow.keras.preprocessing.image import ImageDataGenerator\nfrom tensorflow.keras.optimizers import Adam , Adamax\nfrom tensorflow.keras import regularizers\n\n#Warnings\nimport warnings\nwarnings.filterwarnings('ignore')","metadata":{"_uuid":"8f2839f25d086af736a60e9eeb907d3b93b6e0e5","_cell_guid":"b1076dfc-b9ad-4769-8c92-a6c4dae69d19","trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"import tensorflow as tf\ntf.keras.mixed_precision.set_global_policy('mixed_float16')\n\nimport tensorflow as tf\nimport numpy as np\nimport numpy as np\nimport tensorflow as tf\nfrom tensorflow.keras.layers import Input, Conv2D, MaxPooling2D, Flatten, Dense, Dropout, GlobalAveragePooling2D, BatchNormalization, ReLU, Add\nfrom tensorflow.keras.models import Model\nfrom tensorflow.keras.losses import KLDivergence\nfrom tensorflow.keras.callbacks import ModelCheckpoint, EarlyStopping\nfrom tensorflow.keras.utils import to_categorical\nfrom tensorflow.keras.datasets import cifar10\nfrom tensorflow.keras.applications import EfficientNetB0\nfrom tensorflow.keras.applications import DenseNet121, ResNet50V2\nfrom tensorflow.keras.layers import GlobalAveragePooling2D\nimport copy\nimport numpy as np\nimport tensorflow as tf\nfrom tensorflow.keras.layers import Input, Conv2D, MaxPooling2D, Flatten, Dense, Dropout, GlobalAveragePooling2D, BatchNormalization, ReLU, Add\nfrom tensorflow.keras.models import Model\nfrom tensorflow.keras.losses import KLDivergence\nfrom tensorflow.keras.callbacks import ModelCheckpoint, EarlyStopping\nfrom tensorflow.keras.utils import to_categorical\nfrom tensorflow.keras.datasets import cifar10\nfrom tensorflow.keras.applications import EfficientNetB0\nfrom tensorflow.keras.applications import DenseNet169, MobileNetV2, ResNet50, EfficientNetB0\nfrom tensorflow.keras.layers import GlobalAveragePooling2D\nimport copy\n\nimport tensorflow as tf\nfrom tensorflow.keras import layers\nimport tensorflow as tf\nfrom tensorflow.keras import layers\n","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"X_train_h = np.load('X_train_HAM10000_ISIC_2018.npy')\ny_train_h = np.load('y_train_HAM10000_ISIC_2018.npy')\nX_test_h = np.load('X_test_HAM10000_ISIC_2018.npy')\ny_test_h = np.load('y_test_HAM10000_ISIC_2018.npy')\n\n\nX_train_h.shape, y_train_h.shape, X_test_h.shape, y_test_h.shape\n","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"random_indices = np.random.choice(2003, 810, replace=False)\n\nX_test_h1 = X_test_h[random_indices]\ny_test_h1 = y_test_h[random_indices]\n\nX_test_h1.shape, y_test_h1.shape, X_test_h.shape, y_test_h.shape","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"#X_train_s.shape,X_test_s.shape, y_train_s.shape,y_test_s.shape","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"X_train_h.shape, y_train_h.shape, X_test_h.shape, y_test_h.shape","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"X_train_s = np.load('data_cervical_cancer_sipkamed.npy')\ny_train_s = np.load('labels_cervical_cancer_sipkamed.npy')\n\nX_train_s.shape, y_train_s.shape","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"from sklearn.model_selection import train_test_split\n\nX_train_s, X_test_s, y_train_s, y_test_s = train_test_split(X_train_s, y_train_s, test_size=0.2, random_state=42)\n\nX_train_s.shape,X_test_s.shape, y_train_s.shape,y_test_s.shape","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"import numpy as np\nimport cv2\n\ndef rotate_image(image, angle):\n \"\"\"\n Rotate the image by the specified angle.\n \"\"\"\n center = tuple(np.array(image.shape[1::-1]) / 2)\n rotation_matrix = cv2.getRotationMatrix2D(center, angle, 1.0)\n rotated_image = cv2.warpAffine(image, rotation_matrix, image.shape[1::-1], flags=cv2.INTER_LINEAR)\n return rotated_image\n\ndef translate_image(image, tx, ty):\n \"\"\"\n Translate the image by the specified translation parameters.\n \"\"\"\n translation_matrix = np.float32([[1, 0, tx], [0, 1, ty]])\n translated_image = cv2.warpAffine(image, translation_matrix, image.shape[1::-1])\n return translated_image\n\n# Example data\n#X_train = np.random.rand(100, 28, 28) # Assuming 100 images of size 28x28\n#y_train = np.random.randint(0, 10, 100) # Assuming 100 labels\n\n# Augmentation parameters\nrotation_angles = [20]\ntranslations = [(5, 5)]\n\naugmented_X_train = []\naugmented_y_train = []\n\nfor image, label in zip(X_train_s, y_train_s):\n # Original image\n #augmented_X_train.append(image)\n #augmented_y_train.append(label)\n\n # Augment with rotations\n for angle in rotation_angles:\n rotated_image = rotate_image(image, angle)\n augmented_X_train.append(rotated_image)\n augmented_y_train.append(label)\n\n # Augment with translations\n for tx, ty in translations:\n translated_image = translate_image(image, tx, ty)\n augmented_X_train.append(translated_image)\n augmented_y_train.append(label)\n\n# Convert lists to numpy arrays\naugmented_X_train = np.array(augmented_X_train)\naugmented_y_train = np.array(augmented_y_train)\n\n# Shuffle the data\nshuffle_indices = np.random.permutation(len(augmented_X_train))\naugmented_X_train = augmented_X_train[shuffle_indices]\naugmented_y_train = augmented_y_train[shuffle_indices]\naugmented_X_train.shape, augmented_y_train.shape\n# Now, augmented_X_train and augmented_y_train contain the augmented dataset.","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"random_indices = np.random.choice(6478, 4773, replace=False)\n\naugmented_X_train = augmented_X_train[random_indices]\naugmented_y_train = augmented_y_train[random_indices]\n\naugmented_X_train.shape, augmented_y_train.shape\n","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"X_train_s = np.concatenate((X_train_s, augmented_X_train), axis=0)\ny_train_s = np.concatenate((y_train_s, augmented_y_train), axis=0)\nX_train_s.shape, y_train_s.shape","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"'''X_train_s = np.concatenate((X_train_s, X_train_s, X_train_s), axis=0)\ny_train_s = np.concatenate((y_train_s, y_train_s, y_train_s), axis=0)\nX_train_s.shape, y_train_s.shape'''","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"X_test_s1 = np.concatenate((X_test_s, X_test_s, X_test_s), axis=0)\ny_test_s1 = np.concatenate((y_test_s, y_test_s, y_test_s), axis=0)\nX_test_s1.shape, y_test_s1.shape","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"X_train_s.shape, y_train_s.shape","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"augmented_X_train.shape, augmented_y_train.shape","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"random_indices = np.random.choice(2430, 2003, replace=False)\n\nX_test_s1 = X_test_s1[random_indices]\ny_test_s1 = y_test_s1[random_indices]\n\nX_test_s1.shape, y_test_s1.shape, X_test_s.shape, y_test_s.shape","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"#X_train.shape, y_train.shape, X_test.shape, y_test.shape, \nX_train_s.shape,X_test_s.shape, y_train_s.shape,y_test_s.shape, X_test_s1.shape, y_test_s1.shape","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"print(X_train_h.shape, y_train_h.shape, X_test_h.shape, y_test_h.shape,\n#X_train.shape, y_train.shape, X_test.shape, y_test.shape,\nX_train_s.shape,X_test_s.shape, X_test_s1.shape, y_train_s.shape,y_test_s.shape, y_test_s1.shape)","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"markdown","source":"**Multi-branch fusion attention (MFA) module**","metadata":{}},{"cell_type":"code","source":"#### Multi-branch fusion attention (MFA) module #####\n\nclass DeeperGlobalLocalAttentionLayer1(layers.Layer):\n def __init__(self, units, activation='sigmoid', dropout_rate=0.2, use_scale=True, axis=-1, **kwargs):\n super(DeeperGlobalLocalAttentionLayer1, self).__init__(**kwargs)\n self.units = units\n self.activation = activation\n self.dropout_rate = dropout_rate\n self.use_scale = use_scale\n self.axis = axis\n\n def build(self, input_shape):\n _, _, _, channels = input_shape\n self.global_conv1 = layers.Conv2D(filters=self.units, kernel_size=(1, 1), activation=self.activation)\n self.global_avg_pooling1 = layers.GlobalAveragePooling2D()\n \n self.global_conv2 = layers.Conv2D(filters=self.units, kernel_size=(1, 1), activation=self.activation)\n self.global_avg_pooling2 = layers.GlobalMaxPooling2D()\n \n self.global_conv3 = layers.Conv2D(filters=self.units, kernel_size=(1, 1), activation=self.activation)\n self.global_avg_pooling3 = layers.GlobalAveragePooling2D()\n \n self.global_conv4 = layers.Conv2D(filters=self.units, kernel_size=(1, 1), activation=self.activation)\n self.global_avg_pooling4 = layers.GlobalMaxPooling2D()\n \n self.concat1 = layers.Add()\n self.concat2 = layers.Add()\n self.concat3 = layers.Add()\n self.concat4 = layers.Add()\n self.concat5 = layers.Concatenate(axis=-1)\n \n self.global_attention = layers.Dense(units=self.units, activation=self.activation)\n \n self.local_conv1 = layers.Conv2D(filters=self.units, kernel_size=(1, 1), activation=self.activation)\n self.local_conv2 = layers.Conv2D(filters=self.units, kernel_size=(1, 1), activation=self.activation)\n self.concat6 = layers.Add()\n \n if self.use_scale:\n self.global_scale = self.add_weight(shape=(1, 1, 1, 1), initializer='ones', trainable=True, name='global_scale')\n self.local_scale = self.add_weight(shape=(1, 1, 1, self.units), initializer='ones', trainable=True, name='local_scale')\n \n super(DeeperGlobalLocalAttentionLayer1, self).build(input_shape)\n\n def call(self, inputs, training=None):\n ##### Hierarchical Information Fusion Attention(HIFA) ######\n \n global_attention1 = self.global_conv1(inputs)\n global_avg1 = self.global_avg_pooling1(global_attention1)\n \n global_attention2 = self.global_conv2(global_attention1)\n global_avg2 = self.global_avg_pooling2(global_attention2)\n \n global_concat1 = self.concat1([global_avg1, global_avg2])\n global_attention_concat1 = self.concat2([global_attention1, global_attention2])\n \n global_attention3 = self.global_conv3(global_attention_concat1)\n global_avg3 = self.global_avg_pooling3(global_attention3)\n \n global_attention4 = self.global_conv4(global_attention3)\n global_avg4 = self.global_avg_pooling4(global_attention4)\n \n global_concat2 = self.concat3([global_avg3, global_avg4])\n global_attention_concat2 = self.concat4([global_attention3, global_attention4])\n \n global_avg_concat = self.concat5([global_concat1, global_concat2])\n \n global_attention = self.global_attention(global_avg_concat)\n global_attention = tf.expand_dims(tf.expand_dims(global_attention, 1), 1)\n\n ##### Channel-wise Local Information Attention (CLIA) ######\n \n local_attention1 = self.local_conv1(inputs)\n local_attention1 = tf.reduce_mean(local_attention1, axis=[1, 2], keepdims=True) # Reduce spatial dimensions\n local_attention2 = self.local_conv2(local_attention1)\n local_attention2 = tf.reduce_mean(local_attention2, axis=[1, 2], keepdims=True) # Reduce spatial dimensions\n \n local_attention = self.concat6([local_attention1, local_attention2])\n \n # Scale Global and Local Attention\n if self.use_scale:\n global_attention *= self.global_scale\n local_attention *= self.local_scale\n\n # Combine Global and Local Attention\n attention = tf.sigmoid(global_attention + local_attention)\n return attention\n\n def get_config(self):\n config = super(DeeperGlobalLocalAttentionLayer1, self).get_config()\n config.update({'units': self.units, 'activation': self.activation, 'dropout_rate': self.dropout_rate,\n 'use_scale': self.use_scale})\n return config\n\nclass DeeperAttentionLayer1(layers.Layer):\n def __init__(self, units=64, use_scale=True, **kwargs):\n super(DeeperAttentionLayer1, self).__init__(**kwargs)\n self.units = units\n self.use_scale = use_scale\n\n def build(self, input_shape):\n _, H, W, C = input_shape\n self.alpha = self.add_weight(shape=(1, 1, 1, C), initializer='ones', trainable=True, name='alpha')\n self.deeper_global_local_attention = DeeperGlobalLocalAttentionLayer1(units=self.units, activation='sigmoid', \n dropout_rate=0.2, # You can adjust the dropout rate\n use_scale=self.use_scale)\n super(DeeperAttentionLayer1, self).build(input_shape)\n\n def call(self, inputs, training=None):\n attention = self.deeper_global_local_attention(inputs, training=training)\n attention_feature = inputs * attention * self.alpha\n return attention_feature\n\n def get_config(self):\n config = super(DeeperAttentionLayer1, self).get_config()\n config.update({'units': self.units, 'use_scale': self.use_scale})\n return config\n","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"markdown","source":"**Multimodal information fusion attention (MIFA)**","metadata":{}},{"cell_type":"code","source":"########## Multimodal information fusion attention (MIFA) ###############\n\n\n\nclass GlobalMinPooling2D(layers.Layer):\n def __init__(self, **kwargs):\n super(GlobalMinPooling2D, self).__init__(**kwargs)\n\n def call(self, inputs):\n return tf.reduce_min(inputs, axis=[1, 2])\n\n def compute_output_shape(self, input_shape):\n return (input_shape[0], input_shape[-1])\n\n def get_config(self):\n config = super(GlobalMinPooling2D, self).get_config()\n return config\n\n\nclass DeeperGlobalLocalAttentionLayer(layers.Layer):\n def __init__(self, units, activation='sigmoid', dropout_rate=0.2, use_scale=True, axis=-1, **kwargs):\n super(DeeperGlobalLocalAttentionLayer, self).__init__(**kwargs)\n self.units = units\n self.activation = activation\n self.dropout_rate = dropout_rate\n self.use_scale = use_scale\n self.axis = axis\n\n def build(self, input_shapes):\n input_shape1, input_shape2 = input_shapes\n _, _, _, channels1 = input_shape1\n _, _, _, channels2 = input_shape2\n \n self.global_min_pooling1 = GlobalMinPooling2D()\n self.global_avg_pooling1 = layers.GlobalAveragePooling2D()\n self.global_max_pooling1 = layers.GlobalMaxPooling2D()\n \n self.global_attention = layers.Dense(units=self.units, activation=self.activation)\n \n self.global_min_pooling2 = GlobalMinPooling2D()\n self.global_avg_pooling2 = layers.GlobalAveragePooling2D()\n self.global_max_pooling2 = layers.GlobalMaxPooling2D()\n \n #self.global_attention2 = layers.Dense(units=self.units, activation=self.activation)\n \n \n self.concat = layers.Add()\n #self.global_attention3 = layers.Dense(units=self.units, activation=self.activation)\n \n self.local_conv1 = layers.Conv2D(filters=self.units, kernel_size=(1, 1), activation=self.activation)\n self.local_conv2 = layers.Conv2D(filters=self.units, kernel_size=(1, 1), activation=self.activation)\n \n \n \n self.concat2 = layers.Add()\n #self.local_conv5 = layers.Conv2D(filters=self.units, kernel_size=(1, 1), activation=self.activation)\n \n if self.use_scale:\n self.global_scale = self.add_weight(shape=(1, 1, 1, 1), initializer='ones', trainable=True, name='global_scale')\n self.local_scale = self.add_weight(shape=(1, 1, 1, self.units), initializer='ones', trainable=True, name='local_scale')\n \n super(DeeperGlobalLocalAttentionLayer, self).build(input_shapes)\n\n def call(self, inputs, training=None):\n inputs1, inputs2 = inputs\n\n ######### Multimodal Global Information Fusion Attention (MGIFA) #########\n global_min1 = self.global_min_pooling1(inputs1)\n global_avg1 = self.global_avg_pooling1(inputs1)\n global_max1 = self.global_max_pooling1(inputs1)\n\n global_min2 = self.global_min_pooling2(inputs2)\n global_avg2 = self.global_avg_pooling2(inputs2)\n global_max2 = self.global_max_pooling2(inputs2)\n\n concat_min = self.concat([global_min1, global_min2])\n concat_avg = self.concat([global_avg1, global_avg2])\n concat_max = self.concat([global_max1, global_max2])\n \n concat_min = self.global_attention(concat_min)\n concat_avg = self.global_attention(concat_avg)\n concat_max = self.global_attention(concat_max)\n \n concat_global_attention = self.concat([concat_min, concat_avg, concat_max])\n \n #global_attention = self.global_attention3(concat_global_attention)\n \n global_attention = tf.expand_dims(tf.expand_dims(concat_global_attention, 1), 1)\n\n ######### Multimodal Local Information Fusion Attention (MLIFA) #########\n \n local_conv1 = self.local_conv1(inputs1)\n local_min1 = tf.reduce_min(local_conv1, axis=[1, 2], keepdims=True) # Reduce spatial dimensions\n local_avg1 = tf.reduce_mean(local_conv1, axis=[1, 2], keepdims=True) # Reduce spatial dimensions\n local_max1 = tf.reduce_max(local_conv1, axis=[1, 2], keepdims=True) # Reduce spatial dimensions\n \n local_conv2 = self.local_conv2(inputs2)\n local_min2 = tf.reduce_min(local_conv2, axis=[1, 2], keepdims=True) # Reduce spatial dimensions\n local_avg2 = tf.reduce_mean(local_conv2, axis=[1, 2], keepdims=True) # Reduce spatial dimensions\n local_max2 = tf.reduce_max(local_conv2, axis=[1, 2], keepdims=True) # Reduce spatial dimensions\n \n local_concat_min = self.concat2([local_min1, local_min2])\n local_concat_avg = self.concat2([local_avg1, local_avg2])\n local_concat_max = self.concat2([local_max1, local_max2])\n\n local_attention = self.concat2([local_concat_min, local_concat_avg, local_concat_max])\n \n \n # Scale Global and Local Attention\n if self.use_scale:\n global_attention *= self.global_scale\n local_attention *= self.local_scale\n\n # Combine Global and Local Attention\n attention = tf.sigmoid(global_attention + local_attention)\n return attention\n\n def get_config(self):\n config = super(DeeperGlobalLocalAttentionLayer, self).get_config()\n config.update({'units': self.units, 'activation': self.activation, 'dropout_rate': self.dropout_rate,\n 'use_scale': self.use_scale})\n return config\n\nclass DeeperAttentionLayer(layers.Layer):\n def __init__(self, units=64, use_scale=True,axis=-1, **kwargs):\n super(DeeperAttentionLayer, self).__init__(**kwargs)\n self.units = units\n self.use_scale = use_scale\n self.axis = axis \n\n def build(self, input_shapes):\n input_shape1, input_shape2 = input_shapes\n _, H, W, C1 = input_shape1\n _, H, W, C2 = input_shape2\n \n self.alpha1 = self.add_weight(shape=(1, 1, 1, C1), initializer='ones', trainable=True, name='alpha1')\n self.alpha2 = self.add_weight(shape=(1, 1, 1, C2), initializer='ones', trainable=True, name='alpha2')\n \n self.deeper_global_local_attention = DeeperGlobalLocalAttentionLayer(units=self.units, activation='sigmoid', \n dropout_rate=0.2, # You can adjust the dropout rate\n use_scale=self.use_scale)\n #self.concat3 = layers.Add()\n #self.concat4 = layers.Add()\n \n super(DeeperAttentionLayer, self).build(input_shapes)\n\n def call(self, inputs, training=None):\n inputs1, inputs2 = inputs\n attention = self.deeper_global_local_attention([inputs1, inputs2], training=training)\n \n #inputs_concat = self.concat3([inputs1, inputs2])\n #alpha_concat = self.concat4([self.alpha1, self.alpha2])\n \n attention_feature1 = inputs1 * attention * self.alpha1\n attention_feature2 = inputs2 * attention * self.alpha2\n \n return attention_feature1, attention_feature2\n\n def get_config(self):\n config = super(DeeperAttentionLayer, self).get_config()\n config.update({'units': self.units, 'use_scale': self.use_scale})\n return config\n","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"### RRA block ########\n\ndef RGSA(x, filters, strides=(1, 1), use_projection=False):\n shortcut = x\n\n # Define the first convolutional layer of the block\n \n x = Conv2D(filters=filters, kernel_size=(3, 3), strides=strides, padding='same', \n #activation = 'relu'\n\n )(x)\n x = DeeperAttentionLayer1(units=filters, use_scale=True)(x)\n x = BatchNormalization()(x)\n x = tf.keras.layers.Activation('relu')(x)\n\n # Define the second convolutional layer of the block\n \n x = Conv2D(filters=filters, kernel_size=(3, 3), padding='same')(x)\n x = DeeperAttentionLayer1(units=filters, use_scale=True)(x)\n \n x = BatchNormalization()(x)\n\n # If the stride is not (1, 1), the dimensions need to be adjusted\n if strides != (1, 1) or use_projection:\n \n shortcut = Conv2D(filters=filters, kernel_size=(1, 1), strides=strides, padding='same')(shortcut)\n shortcut = BatchNormalization()(shortcut)\n\n # Add the shortcut (identity connection)\n \n x = tf.keras.layers.add([x, shortcut])\n \n x = tf.keras.layers.Activation('relu')(x)\n return x\n","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"markdown","source":"**DRIFA-Net**","metadata":{}},{"cell_type":"code","source":"def residual_GLC_branch1(inputs1, inputs2):\n \n x1 = Conv2D(filters=64, kernel_size=(7, 7), strides=(2, 2), padding='same')(inputs1)\n x1 = DeeperAttentionLayer1(units=64, use_scale=True)(x1) ## MFA ####\n x1 = BatchNormalization()(x1)\n x1 = tf.keras.layers.Activation('relu')(x1)\n x1 = MaxPooling2D(pool_size=(3, 3), strides=(2, 2), padding='same')(x1)\n \n x2 = Conv2D(filters=64, kernel_size=(7, 7), strides=(2, 2), padding='same')(inputs2)\n x2 = DeeperAttentionLayer1(units=64, use_scale=True)(x2) ## MFA ####\n x2 = BatchNormalization()(x2)\n x2 = tf.keras.layers.Activation('relu')(x2)\n x2 = MaxPooling2D(pool_size=(3, 3), strides=(2, 2), padding='same')(x2)\n \n\n x1 = RGSA(x1, filters=64)\n x1 = tf.keras.layers.Dropout(0.25)(x1, training = True) ## MCD ####\n x1 = DeeperAttentionLayer1(units=64, use_scale=True)(x1) ## MFA ####\n\n x2 = RGSA(x2, filters=64)\n x2 = tf.keras.layers.Dropout(0.25)(x2, training = True) ## MCD ####\n x2 = DeeperAttentionLayer1(units=64, use_scale=True)(x2)\n \n x1, x2 = DeeperAttentionLayer(units=64, use_scale=True)([x1, x2]) ## MIFA ####\n \n x1 = RGSA(x1, filters=64)\n x1 = tf.keras.layers.Dropout(0.25)(x1, training = True) ## MCD ####\n x1 = DeeperAttentionLayer1(units=64, use_scale=True)(x1) ## MFA ####\n \n x2 = RGSA(x2, filters=64)\n x2 = tf.keras.layers.Dropout(0.25)(x2, training = True) ## MCD ####\n x2 = DeeperAttentionLayer1(units=64, use_scale=True)(x2)\n\n x1, x2 = DeeperAttentionLayer(units=64, use_scale=True)([x1, x2]) ## MIFA ####\n \n x1 = RGSA(x1, filters=128, strides=(2, 2), use_projection=True)\n x1 = tf.keras.layers.Dropout(0.25)(x1, training = True) ## MCD ####\n x1 = DeeperAttentionLayer1(units=128, use_scale=True)(x1) ## MFA ####\n\n x2 = RGSA(x2, filters=128, strides=(2, 2), use_projection=True)\n x2 = tf.keras.layers.Dropout(0.25)(x2, training = True) ## MCD ####\n x2 = DeeperAttentionLayer1(units=128, use_scale=True)(x2)\n\n x1, x2 = DeeperAttentionLayer(units=128, use_scale=True)([x1, x2]) ## MIFA ####\n \n x1 = RGSA(x1, filters=128)\n x1 = tf.keras.layers.Dropout(0.25)(x1, training = True) ## MCD ####\n x1 = DeeperAttentionLayer1(units=128, use_scale=True)(x1)\n \n x2 = RGSA(x2, filters=128)\n x2 = tf.keras.layers.Dropout(0.25)(x2, training = True) ## MCD ####\n x2 = DeeperAttentionLayer1(units=128, use_scale=True)(x2)\n\n x1, x2 = DeeperAttentionLayer(units=128, use_scale=True)([x1, x2]) ## MIFA ####\n \n x1 = RGSA(x1, filters=256, strides=(2, 2), use_projection=True)\n x1 = tf.keras.layers.Dropout(0.25)(x1, training = True) ## MCD ####\n x1 = DeeperAttentionLayer1(units=256, use_scale=True)(x1)\n \n x2 = RGSA(x2, filters=256, strides=(2, 2), use_projection=True)\n x2 = tf.keras.layers.Dropout(0.25)(x2, training = True) ## MCD ####\n x2 = DeeperAttentionLayer1(units=256, use_scale=True)(x2)\n\n x1, x2 = DeeperAttentionLayer(units=256, use_scale=True)([x1, x2]) ## MIFA ####\n \n \n x1 = RGSA(x1, filters=256)\n x1 = tf.keras.layers.Dropout(0.25)(x1, training = True) ## MCD ####\n x1 = DeeperAttentionLayer1(units=256, use_scale=True)(x1)\n \n x2 = RGSA(x2, filters=256)\n x2 = tf.keras.layers.Dropout(0.25)(x2, training = True) ## MCD ####\n x2 = DeeperAttentionLayer1(units=256, use_scale=True)(x2)\n \n x1, x2 = DeeperAttentionLayer(units=256, use_scale=True)([x1, x2]) ## MIFA ####\n\n x1 = RGSA(x1, filters=512, strides=(2, 2), use_projection=True)\n x1 = DeeperAttentionLayer1(units=512, use_scale=True)(x1)\n \n x2 = RGSA(x2, filters=512, strides=(2, 2), use_projection=True)\n x2 = DeeperAttentionLayer1(units=512, use_scale=True)(x2)\n\n x1, x2 = DeeperAttentionLayer(units=512, use_scale=True)([x1, x2]) ## MIFA ####\n \n x1 = RGSA(x1, filters=512)\n x2 = RGSA(x2, filters=512)\n x1, x2 = DeeperAttentionLayer(units=512, use_scale=True)([x1, x2])\n \n return x1, x2","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"#def build_resnet18(input_shape=(128, 128, 3), num_classes=2):\ninput_shape=(128, 128, 3)\ninputs1 = Input(shape=input_shape)\ninputs2 = Input(shape=input_shape)\n\n\n\n#input_data = Input(shape=input_shape, name='input_data')\n# Initial convolutional layer\n\nx1, x2 = residual_GLC_branch1(inputs1, inputs2)\n#print('x:',x.shape)\n\ncon = tf.keras.layers.Concatenate(axis=-1)([x1, x2])\n\ncon = tf.keras.layers.Dropout(0.25)(con, training = True) ## MCD ####\n\nx = GlobalAveragePooling2D()(con)\nprint('GlobalAveragePooling2D x:',x.shape)\n\noutputs1 = Dense(5, activation='softmax')(x)\noutputs2 = Dense(7, activation='softmax')(x)\n\n# Create the model\nmodel = Model([inputs1, inputs2], [outputs1, outputs2])\n#return model\nprint(model.summary())","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"from tensorflow.keras.optimizers import Adam\nfrom tensorflow.keras.optimizers.schedules import ExponentialDecay\n\ninitial_gamma = 0.5\n\noptimizer = Adam(learning_rate=0.001)\n# Compile the model with the custom optimizer\nmodel.compile(optimizer=optimizer,\n loss=['categorical_crossentropy', 'categorical_crossentropy'],\n loss_weights=[initial_gamma, (1 - initial_gamma)],\n metrics=['accuracy', 'accuracy'])\n\n\nfrom tensorflow.keras.callbacks import ModelCheckpoint, EarlyStopping\ndef checkpoint_callback():\n\n checkpoint_filepath = 'best1_model_cer_skin_lung.keras'\n\n model_checkpoint_callback= ModelCheckpoint(filepath=checkpoint_filepath,\n save_weights_only=False,\n #frequency='epoch',\n monitor='val_loss',\n save_best_only=True,\n mode='min',\n verbose=0)\n\n return model_checkpoint_callback\n\ndef early_stopping(patience):\n es_callback = tf.keras.callbacks.EarlyStopping(monitor='val_loss', patience=patience, verbose=1)\n return es_callback\n\n\n\nfrom tensorflow.keras.callbacks import ReduceLROnPlateau\n\nreduce_lr = ReduceLROnPlateau(monitor='val_loss', factor=0.2,\n patience=5, min_lr=0.00001)\n\ncheckpoint_callback = checkpoint_callback()\n\nearly_stopping = early_stopping(patience=100)\ncallbacks = [checkpoint_callback, early_stopping, reduce_lr]\n \n\n# Fit the model with callbacks\nhistory = model.fit([X_train_s, X_train_h], [y_train_s, y_train_h],\n epochs=200,\n validation_split=0.2, verbose=1,\n shuffle=True,\n callbacks=callbacks) # UpdateGammaCallback\n","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"model.evaluate([X_test_s, X_test_h1], [y_test_s, y_test_h1])","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"\nmodel.evaluate([X_test_s1, X_test_h], [y_test_s1, y_test_h])","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"y_pred = model.predict([X_test_s1, X_test_h]) \n\ny_pred_binary1 = y_pred[0] >= 0.5\ny_pred_binary_pgd_test1 = np.array(y_pred_binary1, dtype='int32')\n\nprint('y_pred_binary_pgd_test1:', y_pred_binary_pgd_test1.shape)\n\ny_pred_binary2 = y_pred[1] >= 0.5\ny_pred_binary_pgd_test2 = np.array(y_pred_binary2, dtype='int32')\n\nprint('y_pred_binary_pgd_test2:', y_pred_binary_pgd_test2.shape)\n\n#y_test_s, y_test_h\n# Calculate evaluation metrics for the current epsilon\ny_test_categorical1 = y_test_s1\ny_test_categorical2 = y_test_h\n\n## Task 1:\nprint('skin cancer classification:')\naccuracy = accuracy_score(y_pred_binary_pgd_test1, y_test_categorical1) * 100\nprecision = precision_score(y_pred_binary_pgd_test1, y_test_categorical1, average='macro') * 100\nrecall = recall_score(y_pred_binary_pgd_test1, y_test_categorical1, average='macro') * 100\nf1 = f1_score(y_pred_binary_pgd_test1, y_test_categorical1, average='macro') * 100\n#auc = roc_auc_score(y_pred, y_train_categorical, multi_class='ovr') * 100\nprint('accuracy:', accuracy)\nprint('precision:', precision)\nprint('recall:', recall)\nprint('f1:', f1)\n\n## Task 2:\nprint('Cervical cancer classification:')\naccuracy = accuracy_score(y_pred_binary_pgd_test2, y_test_categorical2) * 100\nprecision = precision_score(y_pred_binary_pgd_test2, y_test_categorical2, average='macro') * 100\nrecall = recall_score(y_pred_binary_pgd_test2, y_test_categorical2, average='macro') * 100\nf1 = f1_score(y_pred_binary_pgd_test2, y_test_categorical2, average='macro') * 100\nprint('accuracy:', accuracy)\nprint('precision:', precision)\nprint('recall:', recall)\nprint('f1:', f1)","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"history = model.fit([X_train_s, X_train_h], [y_train_s, y_train_h],\n epochs=100,\n validation_split=0.2, verbose=1,\n shuffle=True,\n callbacks=callbacks)","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"model.evaluate([X_test_s, X_test_h1], [y_test_s, y_test_h1])","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"from tensorflow.keras.models import load_model\n\nmodel1 = load_model('/kaggle/working/best1_model_cer_skin_lung.keras', custom_objects={'DeeperAttentionLayer1': DeeperAttentionLayer1,\n 'DeeperAttentionLayer': DeeperAttentionLayer\n })\nmodel1.evaluate([X_test_s, X_test_h1], [y_test_s, y_test_h1])","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"model.evaluate([X_test_s1, X_test_h], [y_test_s1, y_test_h])","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"y_pred = model.predict([X_test_s1, X_test_h]) \n\ny_pred_binary1 = y_pred[0] >= 0.5\ny_pred_binary_pgd_test1 = np.array(y_pred_binary1, dtype='int32')\n\nprint('y_pred_binary_pgd_test1:', y_pred_binary_pgd_test1.shape)\n\ny_pred_binary2 = y_pred[1] >= 0.5\ny_pred_binary_pgd_test2 = np.array(y_pred_binary2, dtype='int32')\n\nprint('y_pred_binary_pgd_test2:', y_pred_binary_pgd_test2.shape)\n\n#y_test_s, y_test_h\n# Calculate evaluation metrics for the current epsilon\ny_test_categorical1 = y_test_s1\ny_test_categorical2 = y_test_h\n\n## Task 1:\nprint('skin cancer classification:')\naccuracy = accuracy_score(y_pred_binary_pgd_test1, y_test_categorical1) * 100\nprecision = precision_score(y_pred_binary_pgd_test1, y_test_categorical1, average='macro') * 100\nrecall = recall_score(y_pred_binary_pgd_test1, y_test_categorical1, average='macro') * 100\nf1 = f1_score(y_pred_binary_pgd_test1, y_test_categorical1, average='macro') * 100\n#auc = roc_auc_score(y_pred, y_train_categorical, multi_class='ovr') * 100\nprint('accuracy:', accuracy)\nprint('precision:', precision)\nprint('recall:', recall)\nprint('f1:', f1)\n\n## Task 2:\nprint('Cervical cancer classification:')\naccuracy = accuracy_score(y_pred_binary_pgd_test2, y_test_categorical2) * 100\nprecision = precision_score(y_pred_binary_pgd_test2, y_test_categorical2, average='macro') * 100\nrecall = recall_score(y_pred_binary_pgd_test2, y_test_categorical2, average='macro') * 100\nf1 = f1_score(y_pred_binary_pgd_test2, y_test_categorical2, average='macro') * 100\nprint('accuracy:', accuracy)\nprint('precision:', precision)\nprint('recall:', recall)\nprint('f1:', f1)","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"y_pred = model.predict([X_test_s, X_test_h1]) \n\ny_pred_binary1 = y_pred[0] >= 0.5\ny_pred_binary_pgd_test1 = np.array(y_pred_binary1, dtype='int32')\n\nprint('y_pred_binary_pgd_test1:', y_pred_binary_pgd_test1.shape)\n\ny_pred_binary2 = y_pred[1] >= 0.5\ny_pred_binary_pgd_test2 = np.array(y_pred_binary2, dtype='int32')\n\nprint('y_pred_binary_pgd_test2:', y_pred_binary_pgd_test2.shape)\n\n#y_test_s, y_test_h\n# Calculate evaluation metrics for the current epsilon\ny_test_categorical1 = y_test_s\ny_test_categorical2 = y_test_h1\n\n## Task 1:\nprint('skin cancer classification:')\naccuracy = accuracy_score(y_pred_binary_pgd_test1, y_test_categorical1) * 100\nprecision = precision_score(y_pred_binary_pgd_test1, y_test_categorical1, average='macro') * 100\nrecall = recall_score(y_pred_binary_pgd_test1, y_test_categorical1, average='macro') * 100\nf1 = f1_score(y_pred_binary_pgd_test1, y_test_categorical1, average='macro') * 100\n#auc = roc_auc_score(y_pred, y_train_categorical, multi_class='ovr') * 100\nprint('accuracy:', accuracy)\nprint('precision:', precision)\nprint('recall:', recall)\nprint('f1:', f1)\n\n## Task 2:\nprint('Cervical cancer classification:')\naccuracy = accuracy_score(y_pred_binary_pgd_test2, y_test_categorical2) * 100\nprecision = precision_score(y_pred_binary_pgd_test2, y_test_categorical2, average='macro') * 100\nrecall = recall_score(y_pred_binary_pgd_test2, y_test_categorical2, average='macro') * 100\nf1 = f1_score(y_pred_binary_pgd_test2, y_test_categorical2, average='macro') * 100\nprint('accuracy:', accuracy)\nprint('precision:', precision)\nprint('recall:', recall)\nprint('f1:', f1)","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"model.save('best_model_ever.keras')","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"","metadata":{"trusted":true},"outputs":[],"execution_count":null}]}
--------------------------------------------------------------------------------
/uncertainty-quantification-of-drifa-net.ipynb:
--------------------------------------------------------------------------------
1 | {"metadata":{"kernelspec":{"name":"python3","display_name":"Python 3","language":"python"},"language_info":{"name":"python","version":"3.10.12","mimetype":"text/x-python","codemirror_mode":{"name":"ipython","version":3},"pygments_lexer":"ipython3","nbconvert_exporter":"python","file_extension":".py"},"kaggle":{"accelerator":"gpu","dataSources":[],"dockerImageVersionId":30823,"isInternetEnabled":true,"language":"python","sourceType":"notebook","isGpuEnabled":true}},"nbformat_minor":4,"nbformat":4,"cells":[{"cell_type":"markdown","source":"# 1. Import needed libraries","metadata":{}},{"cell_type":"code","source":"import os\nfrom PIL import Image\nimport numpy as np\nimport pandas as pd\nimport matplotlib.pyplot as plt\nimport seaborn as sns\nfrom glob import glob\n#---------------------------------------\nfrom sklearn.model_selection import train_test_split\nfrom sklearn.metrics import classification_report, confusion_matrix\n#---------------------------------------\nimport tensorflow as tf\nfrom tensorflow.keras.models import Sequential\nfrom tensorflow.keras.layers import Dense, Dropout, Flatten\nfrom tensorflow.keras.optimizers import Adamax\nfrom tensorflow.keras.metrics import Precision, Recall\nfrom tensorflow.keras.preprocessing.image import ImageDataGenerator\n#---------------------------------------\nimport warnings\nwarnings.filterwarnings(\"ignore\")","metadata":{"_cell_guid":"b1076dfc-b9ad-4769-8c92-a6c4dae69d19","_uuid":"8f2839f25d086af736a60e9eeb907d3b93b6e0e5","trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"img_rows, img_cols = 128, 128\ninput_shape = (img_rows, img_cols, 3)\n\n#n_classes = df['category'].nunique()\nn_classes = 4\nprint('Total number of unique categories:', n_classes)\n\nfrom os import listdir, makedirs\nfrom os.path import isfile, join, basename, splitext, isfile, exists\n\nimport numpy as np\nimport pandas as pd\n\nfrom tqdm import tqdm_notebook\n\nimport tensorflow as tf\nimport keras.backend as K\n\nimport keras\nfrom keras.models import Sequential, Model\nfrom keras.layers import Dropout, Dense, Flatten, BatchNormalization\nfrom keras.layers import DepthwiseConv2D, SeparableConvolution2D, Convolution2D, Conv2D,GRU, LSTM, AlphaDropout, Embedding, ZeroPadding2D,AveragePooling2D, MaxPooling2D, GlobalAveragePooling2D, GlobalMaxPooling2D, Dropout\nfrom keras.layers import Concatenate, Average, Maximum, Bidirectional, TimeDistributed\nfrom keras.callbacks import Callback, EarlyStopping, ModelCheckpoint\n#from keras.engine.input_layer import Input\nfrom keras.models import load_model\n#from keras.initializers import LecunNormal\n\nimport matplotlib.pyplot as plt\nimport seaborn as sns\n\n#pd.set_option('precision', 30)\nnp.set_printoptions(precision = 30)\n\n\n#tf.set_random_seed(1090)\n\nimport pandas as pd\nimport numpy as np\n\nimport seaborn as sns\nimport matplotlib.pyplot as plt\nimport matplotlib.image as img\n\nimport cv2\nimport itertools\nimport pathlib\nimport warnings\nfrom PIL import Image\nfrom random import randint\nwarnings.filterwarnings('ignore')\n\nfrom imblearn.over_sampling import SMOTE\nfrom sklearn.model_selection import train_test_split\nfrom sklearn.metrics import matthews_corrcoef as MCC\nfrom sklearn.metrics import balanced_accuracy_score as BAS\nfrom sklearn.metrics import classification_report, confusion_matrix\n\n\nfrom tensorflow import keras\nfrom keras import layers\nimport tensorflow as tf\n#import tensorflow_addons as tfa\nfrom tensorflow.keras.preprocessing import image_dataset_from_directory\n##from keras.utils.vis_utils import plot_model\nfrom tensorflow.keras import Sequential, Input\nfrom tensorflow.keras.layers import Dense, Dropout\nfrom tensorflow.keras.layers import Conv2D, Flatten\nfrom tensorflow.keras.callbacks import ReduceLROnPlateau\nfrom tensorflow.keras.applications.inception_v3 import InceptionV3\nfrom tensorflow.keras.preprocessing.image import ImageDataGenerator as IDG\nfrom tensorflow.keras.layers import SeparableConv2D, BatchNormalization, GlobalAveragePooling2D\n\nfrom distutils.dir_util import copy_tree, remove_tree\n\nimport os\n#print(os.listdir(\"../input/alzheimer-mri-dataset/Dataset\"))\nimport tensorflow as tf\nfrom keras.datasets import mnist\nimport cv2\nimport os\nimport pathlib\nfrom keras.layers import Conv2D, Conv2DTranspose,Concatenate, Dropout, Dense, Reshape, LayerNormalization, LeakyReLU\nfrom keras import layers, models\nimport matplotlib.pyplot as plt\nimport numpy as np\nfrom sklearn.metrics import accuracy_score, classification_report\nfrom sklearn.metrics import f1_score, recall_score, precision_score\nprint(\"TensorFlow Version:\", tf.__version__)","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"markdown","source":"### Uncertainty Quantification of DRIFA-Net","metadata":{}},{"cell_type":"code","source":"import numpy as np\nfrom tensorflow.keras.callbacks import ModelCheckpoint\nfrom tensorflow.keras.losses import KLDivergence\n\n# Set a random seed for reproducibility\nnp.random.seed(42)\n\ndef create_ensemble(num_models, input_shape=(128, 128, 3)):\n ensemble_models = []\n \n for _ in range(num_models):\n model = DRIFA_Net(input_shape) # Assuming ResNet18 is defined elsewhere\n ensemble_models.append(model)\n \n return ensemble_models\n\n# Function to perform Monte Carlo Dropout inference\n\n# Example usage\ninput_shape = (128, 128, 3)\nnum_models = 5\ndropout_rate = 0.25\n\nensemble_models = create_ensemble(num_models, input_shape)\n\n# Train each model in the ensemble\nfor i, model in enumerate(ensemble_models):\n print(\"Training Model\", i)\n #model.compile(optimizer='adam', loss='categorical_crossentropy', metrics=['accuracy'])\n model.compile(optimizer='adam', loss=[adaptive_knowledge_distillation_loss,\n adaptive_knowledge_distillation_loss,\n adaptive_knowledge_distillation_loss,\n adaptive_knowledge_distillation_loss], \n metrics=['accuracy', 'accuracy', 'accuracy', 'accuracy'])\n\n \n # Define checkpoint callback for each model\n checkpoint = ModelCheckpoint(f\"best_student_models1_covid_brain_{i}.keras\", monitor='val_loss', \n verbose=1, save_best_only=True, mode='min')\n \n model.fit(x = [images_train_brain_mri, images_train_brain_ct, images_train_covid_cxr, images_train_covid_ct], \n y=([soft_prob_brain_mri, soft_prob_brain_ct, soft_prob_covid_cxr, soft_prob_covid_ct]),\n epochs=200,\n #validation_data=([X_val, X_val_c], [y_val, y_val_c]), \n callbacks = [checkpoint],#batch_size=16,\n #validation_split = 0.2\n validation_data = ([X_val_brain_mri, X_val_brain_ct, X_val_covid_cxr, X_val_covid_ct],\n [y_val_brain_mri, y_val_brain_ct, y_val_covid_cxr, y_val_covid_ct]), verbose=0)","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"for i, model in enumerate(ensemble_models):\n model.evaluate([X_test_brain_mri, X_test_brain_ct,X_test_covid_cxr, X_test_covid_ct], \n[y_test_brain_mri,y_test_brain_ct, y_test_covid_cxr, y_test_covid_ct])","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"'''def monte_carlo_dropout_inference(model, x1, x2, x3, x4, num_samples=3):\n predictions = np.zeros((num_samples,) + model.predict([x1, x2, x3, x4],\n verbose = 0).shape)\n print(len(predictions))\n \n for i in range(num_samples):\n print(i)\n predictions[i, :] = model.predict([x1, x2, x3, x4], verbose = 0)\n\n return predictions\n'''\n\ndef monte_carlo_dropout_inference(model, x1, x2, x3, x4, num_samples=30):\n predictions_shape = model.predict([x1, x2, x3, x4], verbose=0)[0].shape\n predictions = np.zeros((num_samples,) + predictions_shape)\n \n for i in range(num_samples):\n predictions[i, :] = model.predict([x1, x2, x3, x4], verbose=0)[0]\n\n return predictions\n# Perform Monte Carlo Dropout inference for each model in the ensemble\nensemble_predictions = []\nfor model in ensemble_models:\n predictions = monte_carlo_dropout_inference(model, X_test_brain_mri, \n X_test_brain_ct,X_test_covid_cxr, X_test_covid_ct)\n ensemble_predictions.append(predictions)\n\n#print('ensemble_predictions:', ensemble_predictions.shape)\n# Take the mean or other aggregation method across the ensemble predictions\n\n","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"final_prediction_model1 = np.mean(ensemble_predictions[0], axis=0)\n\n# Use the final_prediction for further analysis or decision making\nprint(\"final_prediction_model1:\", final_prediction_model1.shape)","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"'''def monte_carlo_dropout_inference(model, x1, x2, x3, x4, num_samples=3):\n predictions = np.zeros((num_samples,) + model.predict([x1, x2, x3, x4],\n verbose = 0).shape)\n print(len(predictions))\n \n for i in range(num_samples):\n print(i)\n predictions[i, :] = model.predict([x1, x2, x3, x4], verbose = 0)\n\n return predictions\n'''\n\ndef monte_carlo_dropout_inference(model, x1, x2, x3, x4, num_samples=30):\n predictions_shape = model.predict([x1, x2, x3, x4], verbose=0)[1].shape\n predictions = np.zeros((num_samples,) + predictions_shape)\n \n for i in range(num_samples):\n predictions[i, :] = model.predict([x1, x2, x3, x4], verbose=0)[1]\n\n return predictions\n# Perform Monte Carlo Dropout inference for each model in the ensemble\nensemble_predictions = []\nfor model in ensemble_models:\n predictions = monte_carlo_dropout_inference(model, X_test_brain_mri, \n X_test_brain_ct,X_test_covid_cxr, X_test_covid_ct)\n ensemble_predictions.append(predictions)\n\n#print('ensemble_predictions:', ensemble_predictions.shape)\n# Take the mean or other aggregation method across the ensemble predictions\n","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"final_prediction_model2 = np.mean(ensemble_predictions[0], axis=0)\n\n# Use the final_prediction for further analysis or decision making\nprint(\"final_prediction_model2:\", final_prediction_model2.shape)","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"'''def monte_carlo_dropout_inference(model, x1, x2, x3, x4, num_samples=3):\n predictions = np.zeros((num_samples,) + model.predict([x1, x2, x3, x4],\n verbose = 0).shape)\n print(len(predictions))\n \n for i in range(num_samples):\n print(i)\n predictions[i, :] = model.predict([x1, x2, x3, x4], verbose = 0)\n\n return predictions\n'''\n\ndef monte_carlo_dropout_inference(model, x1, x2, x3, x4, num_samples=30):\n predictions_shape = model.predict([x1, x2, x3, x4], verbose=0)[2].shape\n predictions = np.zeros((num_samples,) + predictions_shape)\n \n for i in range(num_samples):\n predictions[i, :] = model.predict([x1, x2, x3, x4], verbose=0)[2]\n\n return predictions\n# Perform Monte Carlo Dropout inference for each model in the ensemble\nensemble_predictions = []\nfor model in ensemble_models:\n predictions = monte_carlo_dropout_inference(model, X_test_brain_mri, \n X_test_brain_ct,X_test_covid_cxr, X_test_covid_ct)\n ensemble_predictions.append(predictions)\n\n#print('ensemble_predictions:', ensemble_predictions.shape)\n# Take the mean or other aggregation method across the ensemble predictions\n","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"final_prediction_model3 = np.mean(ensemble_predictions[0], axis=0)\n\n# Use the final_prediction for further analysis or decision making\nprint(\"final_prediction_model3:\", final_prediction_model3.shape)","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"'''def monte_carlo_dropout_inference(model, x1, x2, x3, x4, num_samples=3):\n predictions = np.zeros((num_samples,) + model.predict([x1, x2, x3, x4],\n verbose = 0).shape)\n print(len(predictions))\n \n for i in range(num_samples):\n print(i)\n predictions[i, :] = model.predict([x1, x2, x3, x4], verbose = 0)\n\n return predictions\n'''\n\ndef monte_carlo_dropout_inference(model, x1, x2, x3, x4, num_samples=30):\n predictions_shape = model.predict([x1, x2, x3, x4], verbose=0)[3].shape\n predictions = np.zeros((num_samples,) + predictions_shape)\n \n for i in range(num_samples):\n predictions[i, :] = model.predict([x1, x2, x3, x4], verbose=0)[3]\n\n return predictions\n# Perform Monte Carlo Dropout inference for each model in the ensemble\nensemble_predictions = []\nfor model in ensemble_models:\n predictions = monte_carlo_dropout_inference(model, X_test_brain_mri, \n X_test_brain_ct,X_test_covid_cxr, X_test_covid_ct)\n ensemble_predictions.append(predictions)\n\n#print('ensemble_predictions:', ensemble_predictions.shape)\n# Take the mean or other aggregation method across the ensemble predictions\n","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"final_prediction_model4 = np.mean(ensemble_predictions[0], axis=0)\n\n# Use the final_prediction for further analysis or decision making\nprint(\"final_prediction_model4:\", final_prediction_model4.shape)","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"y_pred_binary_pgd_test1 = np.argmax(final_prediction_model1, axis=1)\ny_pred_binary_pgd_test2 = np.argmax(final_prediction_model2, axis=1)\ny_pred_binary_pgd_test3 = np.argmax(final_prediction_model3, axis=1)\ny_pred_binary_pgd_test4 = np.argmax(final_prediction_model4, axis=1)\n\ny_test_categorical1 = y_test_brain_mri\ny_test_categorical2 = y_test_brain_ct\ny_test_categorical4 = y_test_covid_ct\ny_test_categorical3 = y_test_covid_cxr\n\ny_test_categorical1 = np.argmax(y_test_categorical1, axis=1)\ny_test_categorical2 = np.argmax(y_test_categorical2, axis=1)\ny_test_categorical3 = np.argmax(y_test_categorical3, axis=1)\ny_test_categorical4 = np.argmax(y_test_categorical4, axis=1)\n\n## Task 1:\nprint('Task 1:')\nprint('Brain Tumours classification in MRI images:')\naccuracy = accuracy_score(y_pred_binary_pgd_test1, y_test_categorical1) * 100\nprecision = precision_score(y_pred_binary_pgd_test1, y_test_categorical1, average='macro') * 100\nrecall = recall_score(y_pred_binary_pgd_test1, y_test_categorical1, average='macro') * 100\nf1 = f1_score(y_pred_binary_pgd_test1, y_test_categorical1, average='macro') * 100\n#auc = roc_auc_score(y_pred, y_train_categorical, multi_class='ovr') * 100\nprint('accuracy:', accuracy)\nprint('precision:', precision)\nprint('recall:', recall)\nprint('f1:', f1)\n\n## Task 2:\nprint('Task 2:')\nprint('Brain Stroke classification in CT scan images:')\naccuracy = accuracy_score(y_pred_binary_pgd_test2, y_test_categorical2) * 100\nprecision = precision_score(y_pred_binary_pgd_test2, y_test_categorical2, average='macro') * 100\nrecall = recall_score(y_pred_binary_pgd_test2, y_test_categorical2, average='macro') * 100\nf1 = f1_score(y_pred_binary_pgd_test2, y_test_categorical2, average='macro') * 100\nprint('accuracy:', accuracy)\nprint('precision:', precision)\nprint('recall:', recall)\nprint('f1:', f1)\n\n## Task 3:\nprint('Task 3:')\nprint('COVID19 classification in CXR images:')\naccuracy = accuracy_score(y_pred_binary_pgd_test3, y_test_categorical3) * 100\nprecision = precision_score(y_pred_binary_pgd_test3, y_test_categorical3, average='macro') * 100\nrecall = recall_score(y_pred_binary_pgd_test3, y_test_categorical3, average='macro') * 100\nf1 = f1_score(y_pred_binary_pgd_test3, y_test_categorical3, average='macro') * 100\n#auc = roc_auc_score(y_pred, y_train_categorical, multi_class='ovr') * 100\nprint('accuracy:', accuracy)\nprint('precision:', precision)\nprint('recall:', recall)\nprint('f1:', f1)\n\n## Task 4:\nprint('Task 4:')\nprint('COVID19 classification in CT scan images:')\naccuracy = accuracy_score(y_pred_binary_pgd_test4, y_test_categorical4) * 100\nprecision = precision_score(y_pred_binary_pgd_test4, y_test_categorical4, average='macro') * 100\nrecall = recall_score(y_pred_binary_pgd_test4, y_test_categorical4, average='macro') * 100\nf1 = f1_score(y_pred_binary_pgd_test4, y_test_categorical4, average='macro') * 100\nprint('accuracy:', accuracy)\nprint('precision:', precision)\nprint('recall:', recall)\nprint('f1:', f1)","metadata":{"trusted":true},"outputs":[],"execution_count":null},{"cell_type":"code","source":"","metadata":{"trusted":true},"outputs":[],"execution_count":null}]}
--------------------------------------------------------------------------------