!pip install tensorflow[and-cuda] numpy==1.25.2 -q

import tensorflow as tf
print("Num GPUs Available:", len(tf.config.list_physical_devices('GPU')))
print(tf.__version__)

Num GPUs Available: 1
2.17.1

import os
import random
import numpy as np                                                                               # Importing numpy for Matrix Operations
import pandas as pd
import seaborn as sns
import matplotlib.image as mpimg                                                                 # Importing pandas to read CSV files
import matplotlib.pyplot as plt                                                                  # Importting matplotlib for Plotting and visualizing images
import math                                                                                      # Importing math module to perform mathematical operations
import cv2


# Tensorflow modules
import keras
import tensorflow as tf
from tensorflow.keras.preprocessing.image import ImageDataGenerator                              # Importing the ImageDataGenerator for data augmentation
from tensorflow.keras.models import Sequential                                                   # Importing the sequential module to define a sequential model
from tensorflow.keras.layers import Dense,Dropout,Flatten,Conv2D,MaxPooling2D,BatchNormalization # Defining all the layers to build our CNN Model
from tensorflow.keras.optimizers import Adam,SGD                                                 # Importing the optimizers which can be used in our model
from sklearn import preprocessing                                                                # Importing the preprocessing module to preprocess the data
from sklearn.model_selection import train_test_split                                             # Importing train_test_split function to split the data into train and test
from sklearn.metrics import confusion_matrix
from tensorflow.keras.models import Model
from keras.applications.vgg16 import VGG16                                                       # Importing confusion_matrix to plot the confusion matrix

# Display images using OpenCV
from google.colab.patches import cv2_imshow

#Imports functions for evaluating the performance of machine learning models
from sklearn.metrics import confusion_matrix, f1_score,accuracy_score, recall_score, precision_score, classification_report
from sklearn.metrics import mean_squared_error as mse                                            # Importing cv2_imshow from google.patches to display images

# Ignore warnings
import warnings
warnings.filterwarnings('ignore')

# Set the seed using keras.utils.set_random_seed. This will set:
# 1) `numpy` seed
# 2) backend random seed
# 3) `python` random seed
tf.keras.utils.set_random_seed(812)

# Uncomment and run the following code in case Google Colab is being used
from google.colab import drive
drive.mount('/content/drive')

Mounted at /content/drive

# Load image data and labels
X = np.load('/content/drive/MyDrive/Colab Notebooks/Project 6/HelmNet_images_proj.npy')  # shape should be (631, H, W, C)
y_df = pd.read_csv('/content/drive/MyDrive/Colab Notebooks/Project 6/HelmNet_Labels_proj.csv')  # should contain binary labels

# Inspect dimensions
print(f"Image Data Shape: {X.shape}")
print(f"Labels DataFrame Shape: {y_df.shape}")
print(y_df.head())

Image Data Shape: (631, 200, 200, 3)
Labels DataFrame Shape: (631, 1)
   Label
0      1
1      1
2      1
3      1
4      1

# Convert labels to a flat Numpy Array to view the classes
y = y_df['Label'].values  # shape will be (631,)
print(f"y shape: {y.shape}")
print(f"Unique classes: {np.unique(y)}")

y shape: (631,)
Unique classes: [0 1]

# Plot the class distribution with Seaborn countplot.
sns.countplot(x=y_df['Label'])
plt.title("Class Distribution: With Helmet (1) vs Without Helmet (0)")
plt.xlabel("Label")
plt.ylabel("Count")
plt.show()

# Show sample images
# Convert to NumPy array if not already
X = np.array(X)
y = np.array(y)

# Find indices for each class
helmet_indices = np.where(y == 1)[0]
no_helmet_indices = np.where(y == 0)[0]

# Pick 5 random indices from each
helmet_samples = random.sample(list(helmet_indices), 5)
no_helmet_samples = random.sample(list(no_helmet_indices), 5)

# Plot images without helmet
plt.figure(figsize=(15, 4))
for i, idx in enumerate(no_helmet_samples):
    plt.subplot(2, 5, i+1)
    plt.imshow(X[idx].squeeze(), cmap='gray' if X.shape[-1] == 1 else None) # Ensures any grayscale images are shown correctly
    plt.title("No Helmet")
    plt.axis('off')

# Plot images with helmet
for i, idx in enumerate(helmet_samples):
    plt.subplot(2, 5, i+6)
    plt.imshow(X[idx].squeeze(), cmap='gray' if X.shape[-1] == 1 else None)
    plt.title("With Helmet")
    plt.axis('off')

plt.suptitle("Sample Images by Class", fontsize=16)
plt.tight_layout()
plt.show()

# Convert RGB images to Grayscale
X_gray = np.array([cv2.cvtColor(img, cv2.COLOR_RGB2GRAY) for img in X])

# Reshape to match CNN input (samples, height, width, channels)
X_gray = X_gray.reshape(X_gray.shape[0], X_gray.shape[1], X_gray.shape[2], 1)

# Confirm shape
print(f"X_gray shape: {X_gray.shape}")

X_gray shape: (631, 200, 200, 1)

# First split: 70% train, 30% temp (val+test)
X_train, X_temp, y_train, y_temp = train_test_split(
    X_gray, y, test_size=0.3, random_state=42, stratify=y
)

# Second split: 50% of the temp set goes to val, 50% to test
X_val, X_test, y_val, y_test = train_test_split(
    X_temp, y_temp, test_size=0.5, random_state=42, stratify=y_temp
)

print(f"Train set: {X_train.shape[0]}")
print(f"Validation set: {X_val.shape[0]}")
print(f"Test set: {X_test.shape[0]}")

Train set: 441
Validation set: 95
Test set: 95

# Since pixel values are currently in the range [0, 255] (as is typical for images), we’ll scale them to the range [0.0, 1.0] by dividing by 255
# Normalize grayscale pixel values to [0.0, 1.0]
X_train = X_train / 255.0
X_val = X_val / 255.0
X_test = X_test / 255.0

print(f"Train min: {X_train.min()}, max: {X_train.max()}")
print(f"Val min: {X_val.min()}, max: {X_val.max()}")
print(f"Test min: {X_test.min()}, max: {X_test.max()}")

Train min: 0.0, max: 1.0
Val min: 0.0, max: 1.0
Test min: 0.0, max: 1.0

# defining a function to compute different metrics to check performance of a classification model built using statsmodels
def model_performance_classification(model, predictors, target):
    """
    Function to compute different metrics to check classification model performance

    model: classifier
    predictors: independent variables
    target: dependent variable
    """

    # checking which probabilities are greater than threshold
    pred = model.predict(predictors).reshape(-1)>0.5

    target = target.to_numpy().reshape(-1)


    acc = accuracy_score(target, pred)  # to compute Accuracy
    recall = recall_score(target, pred, average='weighted')  # to compute Recall
    precision = precision_score(target, pred, average='weighted')  # to compute Precision
    f1 = f1_score(target, pred, average='weighted')  # to compute F1-score

    # creating a dataframe of metrics
    df_perf = pd.DataFrame({"Accuracy": acc, "Recall": recall, "Precision": precision, "F1 Score": f1,},index=[0],)

    return df_perf

def plot_confusion_matrix(model,predictors,target,ml=False):
    """
    Function to plot the confusion matrix

    model: classifier
    predictors: independent variables
    target: dependent variable
    ml: To specify if the model used is an sklearn ML model or not (True means ML model)
    """

    # checking which probabilities are greater than threshold
    pred = model.predict(predictors).reshape(-1)>0.5

    target = target.to_numpy().reshape(-1)

    # Plotting the Confusion Matrix using confusion matrix() function which is also predefined tensorflow module
    confusion_matrix = tf.math.confusion_matrix(target,pred)
    f, ax = plt.subplots(figsize=(10, 8))
    sns.heatmap(
        confusion_matrix,
        annot=True,
        linewidths=.4,
        fmt="d",
        square=True,
        ax=ax
    )
    plt.show()

# Define the CNN architecture
cnn_model_1 = Sequential([
    Conv2D(32, (3, 3), activation='relu', input_shape=X_train.shape[1:]),
    MaxPooling2D(pool_size=(2, 2)),

    Conv2D(64, (3, 3), activation='relu'),
    MaxPooling2D(pool_size=(2, 2)),

    Flatten(),
    Dense(128, activation='relu'),
    Dropout(0.5),
    Dense(1, activation='sigmoid')  # Output layer for binary classification
])

# Compile the model
cnn_model_1.compile(optimizer='adam',
                  loss='binary_crossentropy',
                  metrics=['accuracy'])

# Display model summary
cnn_model_1.summary()

Model: "sequential"

┏━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━┓
┃ Layer (type)                    ┃ Output Shape           ┃       Param # ┃
┡━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━┩
│ conv2d (Conv2D)                 │ (None, 198, 198, 32)   │           320 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ max_pooling2d (MaxPooling2D)    │ (None, 99, 99, 32)     │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ conv2d_1 (Conv2D)               │ (None, 97, 97, 64)     │        18,496 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ max_pooling2d_1 (MaxPooling2D)  │ (None, 48, 48, 64)     │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ flatten (Flatten)               │ (None, 147456)         │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ dense (Dense)                   │ (None, 128)            │    18,874,496 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ dropout (Dropout)               │ (None, 128)            │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ dense_1 (Dense)                 │ (None, 1)              │           129 │
└─────────────────────────────────┴────────────────────────┴───────────────┘

 Total params: 18,893,441 (72.07 MB)

 Trainable params: 18,893,441 (72.07 MB)

 Non-trainable params: 0 (0.00 B)

history_1 = cnn_model_1.fit(
    X_train, y_train,
    validation_data=(X_val, y_val),
    epochs=10,
    batch_size=32,
    verbose=2
)

Epoch 1/10
14/14 - 16s - 1s/step - accuracy: 0.7234 - loss: 1.4835 - val_accuracy: 0.9263 - val_loss: 0.2959
Epoch 2/10
14/14 - 8s - 560ms/step - accuracy: 0.9478 - loss: 0.1686 - val_accuracy: 0.9684 - val_loss: 0.0770
Epoch 3/10
14/14 - 1s - 37ms/step - accuracy: 0.9773 - loss: 0.0854 - val_accuracy: 0.9684 - val_loss: 0.0719
Epoch 4/10
14/14 - 1s - 45ms/step - accuracy: 0.9796 - loss: 0.0612 - val_accuracy: 0.9789 - val_loss: 0.0673
Epoch 5/10
14/14 - 1s - 41ms/step - accuracy: 1.0000 - loss: 0.0128 - val_accuracy: 0.9895 - val_loss: 0.0780
Epoch 6/10
14/14 - 1s - 46ms/step - accuracy: 0.9977 - loss: 0.0106 - val_accuracy: 0.9684 - val_loss: 0.0837
Epoch 7/10
14/14 - 1s - 42ms/step - accuracy: 0.9955 - loss: 0.0170 - val_accuracy: 0.9895 - val_loss: 0.1037
Epoch 8/10
14/14 - 1s - 46ms/step - accuracy: 1.0000 - loss: 0.0055 - val_accuracy: 0.9789 - val_loss: 0.0870
Epoch 9/10
14/14 - 1s - 44ms/step - accuracy: 1.0000 - loss: 0.0045 - val_accuracy: 0.9895 - val_loss: 0.0966
Epoch 10/10
14/14 - 0s - 35ms/step - accuracy: 1.0000 - loss: 0.0027 - val_accuracy: 0.9789 - val_loss: 0.0900

plt.plot(history_1.history['accuracy'])
plt.plot(history_1.history['val_accuracy'])
plt.title('Model Accuracy over Epochs')
plt.ylabel('Accuracy')
plt.xlabel('Epoch')
plt.legend(['Train', 'Validation'], loc='upper left')
plt.show()

# Evaluate on Train Set
print("Train performance metrics:")
cnn_model_1_train_perf = model_performance_classification(cnn_model_1, X_train, pd.Series(y_train))
display(cnn_model_1_train_perf)

plot_confusion_matrix(cnn_model_1, X_train, pd.Series(y_train))

# Evaluate on Validation Set
print("Validation performance metrics:")
cnn_model_1_val_perf = model_performance_classification(cnn_model_1, X_val, pd.Series(y_val))
display(cnn_model_1_val_perf)

print("\n" + "=" * 60)
print("CONFUSION MATRIX")
print("=" * 60 + "\n") # print separator line

plot_confusion_matrix(cnn_model_1, X_val, pd.Series(y_val))

# Evaluate on Test Set
# print("Test performance metrics:")
# cnn_model_1_test_perf = model_performance_classification(cnn_model_1, X_test, pd.Series(y_test))
# display(cnn_model_1_test_perf)

# print("\n" + "=" * 60)
# print("CONFUSION MATRIX")
# print("=" * 60 + "\n") # print separator line

# plot_confusion_matrix(cnn_model_1, X_test, pd.Series(y_test))

Train performance metrics:
14/14 ━━━━━━━━━━━━━━━━━━━━ 1s 71ms/step

14/14 ━━━━━━━━━━━━━━━━━━━━ 0s 9ms/step

Validation performance metrics:
3/3 ━━━━━━━━━━━━━━━━━━━━ 0s 92ms/step

============================================================
CONFUSION MATRIX
============================================================

3/3 ━━━━━━━━━━━━━━━━━━━━ 0s 17ms/step

# Visualize and predict for index 12
index = 12
plt.figure(figsize=(2,2))
plt.imshow(X_val[index].reshape(X_val.shape[1], X_val.shape[2]), cmap='gray')
plt.title(f"Image at index {index}")
plt.axis('off')
plt.show()

# Make prediction
prediction = cnn_model_1.predict(X_val[index].reshape(1, X_val.shape[1], X_val.shape[2], 1))
predicted_label = 1 if prediction[0][0] > 0.5 else 0
print('Predicted Label:', predicted_label)
print('True Label:', y_val[index])

# Repeat for index 33
index = 33
plt.figure(figsize=(2,2))
plt.imshow(X_val[index].reshape(X_val.shape[1], X_val.shape[2]), cmap='gray')
plt.title(f"Image at index {index}")
plt.axis('off')
plt.show()

prediction = cnn_model_1.predict(X_val[index].reshape(1, X_val.shape[1], X_val.shape[2], 1))
predicted_label = 1 if prediction[0][0] > 0.5 else 0
print('Predicted Label:', predicted_label)
print('True Label:', y_val[index])

1/1 ━━━━━━━━━━━━━━━━━━━━ 1s 777ms/step
Predicted Label: 1
True Label: 1

1/1 ━━━━━━━━━━━━━━━━━━━━ 0s 29ms/step
Predicted Label: 0
True Label: 0

# Convert grayscale to RGB-like format for VGG (e.g., (128, 128, 1) → (128, 128, 3))
X_train_vgg = np.repeat(X_train, 3, axis=-1)
X_val_vgg = np.repeat(X_val, 3, axis=-1)
X_test_vgg = np.repeat(X_test, 3, axis=-1)

# Load base VGG16 model without top layer
vgg_base = VGG16(weights='imagenet', include_top=False, input_shape=X_train_vgg.shape[1:])

# Freeze all layers first
for layer in vgg_base.layers:
    layer.trainable = False

# Unfreeze the last 4 layers
for layer in vgg_base.layers[-4:]:
    layer.trainable = True

Downloading data from https://storage.googleapis.com/tensorflow/keras-applications/vgg16/vgg16_weights_tf_dim_ordering_tf_kernels_notop.h5
58889256/58889256 ━━━━━━━━━━━━━━━━━━━━ 2s 0us/step

# Add custom head
x = vgg_base.output
x = Flatten()(x)
x = Dense(128, activation='relu')(x)
x = Dropout(0.8)(x)
output = Dense(1, activation='sigmoid')(x)

# Define the final model
cnn_model_2 = Model(inputs=vgg_base.input, outputs=output)

cnn_model_2.compile(
    optimizer=Adam(learning_rate=0.000001),  # small LR is safer with pre-trained weights
    loss='binary_crossentropy',
    metrics=['accuracy']
)

cnn_model_2.summary()

Model: "functional_1"

┏━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━┓
┃ Layer (type)                    ┃ Output Shape           ┃       Param # ┃
┡━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━┩
│ input_layer_1 (InputLayer)      │ (None, 200, 200, 3)    │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block1_conv1 (Conv2D)           │ (None, 200, 200, 64)   │         1,792 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block1_conv2 (Conv2D)           │ (None, 200, 200, 64)   │        36,928 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block1_pool (MaxPooling2D)      │ (None, 100, 100, 64)   │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block2_conv1 (Conv2D)           │ (None, 100, 100, 128)  │        73,856 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block2_conv2 (Conv2D)           │ (None, 100, 100, 128)  │       147,584 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block2_pool (MaxPooling2D)      │ (None, 50, 50, 128)    │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block3_conv1 (Conv2D)           │ (None, 50, 50, 256)    │       295,168 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block3_conv2 (Conv2D)           │ (None, 50, 50, 256)    │       590,080 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block3_conv3 (Conv2D)           │ (None, 50, 50, 256)    │       590,080 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block3_pool (MaxPooling2D)      │ (None, 25, 25, 256)    │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block4_conv1 (Conv2D)           │ (None, 25, 25, 512)    │     1,180,160 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block4_conv2 (Conv2D)           │ (None, 25, 25, 512)    │     2,359,808 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block4_conv3 (Conv2D)           │ (None, 25, 25, 512)    │     2,359,808 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block4_pool (MaxPooling2D)      │ (None, 12, 12, 512)    │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block5_conv1 (Conv2D)           │ (None, 12, 12, 512)    │     2,359,808 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block5_conv2 (Conv2D)           │ (None, 12, 12, 512)    │     2,359,808 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block5_conv3 (Conv2D)           │ (None, 12, 12, 512)    │     2,359,808 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block5_pool (MaxPooling2D)      │ (None, 6, 6, 512)      │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ flatten_1 (Flatten)             │ (None, 18432)          │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ dense_2 (Dense)                 │ (None, 128)            │     2,359,424 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ dropout_1 (Dropout)             │ (None, 128)            │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ dense_3 (Dense)                 │ (None, 1)              │           129 │
└─────────────────────────────────┴────────────────────────┴───────────────┘

 Total params: 17,074,241 (65.13 MB)

 Trainable params: 9,438,977 (36.01 MB)

 Non-trainable params: 7,635,264 (29.13 MB)

history_2 = cnn_model_2.fit(
    X_train_vgg, y_train,
    validation_data=(X_val_vgg, y_val),
    epochs=10,
    batch_size=32,
    verbose=2
)

Epoch 1/10
14/14 - 40s - 3s/step - accuracy: 0.5193 - loss: 0.8675 - val_accuracy: 0.4632 - val_loss: 0.7061
Epoch 2/10
14/14 - 5s - 336ms/step - accuracy: 0.4943 - loss: 0.8529 - val_accuracy: 0.5368 - val_loss: 0.6603
Epoch 3/10
14/14 - 2s - 172ms/step - accuracy: 0.5692 - loss: 0.7801 - val_accuracy: 0.6421 - val_loss: 0.6178
Epoch 4/10
14/14 - 2s - 167ms/step - accuracy: 0.5692 - loss: 0.7798 - val_accuracy: 0.8421 - val_loss: 0.5777
Epoch 5/10
14/14 - 2s - 174ms/step - accuracy: 0.6259 - loss: 0.6870 - val_accuracy: 0.8842 - val_loss: 0.5420
Epoch 6/10
14/14 - 3s - 182ms/step - accuracy: 0.6712 - loss: 0.6239 - val_accuracy: 0.9263 - val_loss: 0.5094
Epoch 7/10
14/14 - 3s - 203ms/step - accuracy: 0.6735 - loss: 0.6096 - val_accuracy: 0.9474 - val_loss: 0.4782
Epoch 8/10
14/14 - 2s - 160ms/step - accuracy: 0.6667 - loss: 0.6114 - val_accuracy: 0.9474 - val_loss: 0.4485
Epoch 9/10
14/14 - 2s - 156ms/step - accuracy: 0.6916 - loss: 0.5909 - val_accuracy: 0.9684 - val_loss: 0.4187
Epoch 10/10
14/14 - 2s - 174ms/step - accuracy: 0.7415 - loss: 0.5101 - val_accuracy: 0.9789 - val_loss: 0.3907

plt.plot(history_2.history['accuracy'])
plt.plot(history_2.history['val_accuracy'])
plt.title('Model Accuracy over Epochs')
plt.ylabel('Accuracy')
plt.xlabel('Epoch')
plt.legend(['Train', 'Validation'], loc='upper left')
plt.show()

# Evaluate on Train Set
print("Train performance metrics:")
cnn_model_2_train_perf = model_performance_classification(cnn_model_2, X_train_vgg, pd.Series(y_train))
display(cnn_model_2_train_perf)

plot_confusion_matrix(cnn_model_2, X_train_vgg, pd.Series(y_train))

# Evaluate on Validation Set
print("Validation performance metrics:")
cnn_model_2_val_perf = model_performance_classification(cnn_model_2, X_val_vgg, pd.Series(y_val))
display(cnn_model_2_val_perf)

print("\n" + "=" * 60)
print("CONFUSION MATRIX")
print("=" * 60 + "\n")  # print separator line

plot_confusion_matrix(cnn_model_2, X_val_vgg, pd.Series(y_val))

# Hold off on Test Set — uncomment only when ready to evaluate final model
# print("Test performance metrics:")
# cnn_model_2_test_perf = model_performance_classification(cnn_model_2, X_test_vgg, pd.Series(y_test))
# display(cnn_model_2_test_perf)

# print("\n" + "=" * 60)
# print("CONFUSION MATRIX")
# print("=" * 60 + "\n")

# plot_confusion_matrix(cnn_model_2, X_test_vgg, pd.Series(y_test))

Train performance metrics:
14/14 ━━━━━━━━━━━━━━━━━━━━ 3s 173ms/step

14/14 ━━━━━━━━━━━━━━━━━━━━ 2s 105ms/step

Validation performance metrics:
3/3 ━━━━━━━━━━━━━━━━━━━━ 1s 243ms/step

============================================================
CONFUSION MATRIX
============================================================

3/3 ━━━━━━━━━━━━━━━━━━━━ 0s 113ms/step

print("Train:", np.bincount(y_train))
print("Val:", np.bincount(y_val))
print("Test:", np.bincount(y_test))

Train: [224 217]
Val: [48 47]
Test: [48 47]

# For index 12
index = 12
plt.figure(figsize=(2, 2))
plt.imshow(X_val[index].reshape(X_val.shape[1], X_val.shape[2]), cmap='gray')  # grayscale view
plt.title(f"Image at index {index}")
plt.axis('off')
plt.show()

# Predict using the RGB-converted version
prediction = cnn_model_2.predict(X_val_vgg[index].reshape(1, X_val.shape[1], X_val.shape[2], 3))
predicted_label = 1 if prediction[0][0] > 0.5 else 0
print('Predicted Label:', predicted_label)
print('True Label:', y_val[index])

# For index 33
index = 33
plt.figure(figsize=(2, 2))
plt.imshow(X_val[index].reshape(X_val.shape[1], X_val.shape[2]), cmap='gray')  # grayscale view
plt.title(f"Image at index {index}")
plt.axis('off')
plt.show()

prediction = cnn_model_2.predict(X_val_vgg[index].reshape(1, X_val.shape[1], X_val.shape[2], 3))
predicted_label = 1 if prediction[0][0] > 0.5 else 0
print('Predicted Label:', predicted_label)
print('True Label:', y_val[index])

1/1 ━━━━━━━━━━━━━━━━━━━━ 2s 2s/step
Predicted Label: 1
True Label: 1

1/1 ━━━━━━━━━━━━━━━━━━━━ 0s 45ms/step
Predicted Label: 0
True Label: 0

# Convert grayscale to RGB-like format for VGG (e.g., (128, 128, 1) → (128, 128, 3))
X_train_vgg = np.repeat(X_train, 3, axis=-1)
X_val_vgg = np.repeat(X_val, 3, axis=-1)
X_test_vgg = np.repeat(X_test, 3, axis=-1)

# Load base VGG16 model without top layer
vgg_base = VGG16(weights='imagenet', include_top=False, input_shape=X_train_vgg.shape[1:])

# Freeze all layers first
for layer in vgg_base.layers:
    layer.trainable = False

# Unfreeze the last 4 layers
# for layer in vgg_base.layers[-4:]:
#   layer.trainable = True

# Add a Deeper FFNN Head
x = vgg_base.output
x = Flatten()(x)
x = Dense(256, activation='relu')(x)
x = Dropout(0.7)(x)
x = Dense(128, activation='relu')(x)
x = Dropout(0.8)(x)
output = Dense(1, activation='sigmoid')(x)

# Define the final model
cnn_model_3 = Model(inputs=vgg_base.input, outputs=output)

cnn_model_3.compile(
    optimizer=Adam(learning_rate=0.00001),  # small LR is safer with pre-trained weights
    loss='binary_crossentropy',
    metrics=['accuracy']
)

cnn_model_3.summary()

Model: "functional_2"

┏━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━┓
┃ Layer (type)                    ┃ Output Shape           ┃       Param # ┃
┡━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━┩
│ input_layer_2 (InputLayer)      │ (None, 200, 200, 3)    │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block1_conv1 (Conv2D)           │ (None, 200, 200, 64)   │         1,792 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block1_conv2 (Conv2D)           │ (None, 200, 200, 64)   │        36,928 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block1_pool (MaxPooling2D)      │ (None, 100, 100, 64)   │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block2_conv1 (Conv2D)           │ (None, 100, 100, 128)  │        73,856 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block2_conv2 (Conv2D)           │ (None, 100, 100, 128)  │       147,584 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block2_pool (MaxPooling2D)      │ (None, 50, 50, 128)    │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block3_conv1 (Conv2D)           │ (None, 50, 50, 256)    │       295,168 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block3_conv2 (Conv2D)           │ (None, 50, 50, 256)    │       590,080 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block3_conv3 (Conv2D)           │ (None, 50, 50, 256)    │       590,080 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block3_pool (MaxPooling2D)      │ (None, 25, 25, 256)    │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block4_conv1 (Conv2D)           │ (None, 25, 25, 512)    │     1,180,160 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block4_conv2 (Conv2D)           │ (None, 25, 25, 512)    │     2,359,808 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block4_conv3 (Conv2D)           │ (None, 25, 25, 512)    │     2,359,808 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block4_pool (MaxPooling2D)      │ (None, 12, 12, 512)    │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block5_conv1 (Conv2D)           │ (None, 12, 12, 512)    │     2,359,808 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block5_conv2 (Conv2D)           │ (None, 12, 12, 512)    │     2,359,808 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block5_conv3 (Conv2D)           │ (None, 12, 12, 512)    │     2,359,808 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block5_pool (MaxPooling2D)      │ (None, 6, 6, 512)      │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ flatten_2 (Flatten)             │ (None, 18432)          │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ dense_4 (Dense)                 │ (None, 256)            │     4,718,848 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ dropout_2 (Dropout)             │ (None, 256)            │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ dense_5 (Dense)                 │ (None, 128)            │        32,896 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ dropout_3 (Dropout)             │ (None, 128)            │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ dense_6 (Dense)                 │ (None, 1)              │           129 │
└─────────────────────────────────┴────────────────────────┴───────────────┘

 Total params: 19,466,561 (74.26 MB)

 Trainable params: 4,751,873 (18.13 MB)

 Non-trainable params: 14,714,688 (56.13 MB)

history_3 = cnn_model_3.fit(
    X_train_vgg, y_train,
    validation_data=(X_val_vgg, y_val),
    epochs=10,
    batch_size=32,
    verbose=2
)

Epoch 1/10
14/14 - 10s - 689ms/step - accuracy: 0.5238 - loss: 1.1254 - val_accuracy: 0.8421 - val_loss: 0.5862
Epoch 2/10
14/14 - 2s - 148ms/step - accuracy: 0.5828 - loss: 1.0004 - val_accuracy: 0.9053 - val_loss: 0.5168
Epoch 3/10
14/14 - 2s - 129ms/step - accuracy: 0.5873 - loss: 0.8331 - val_accuracy: 0.8842 - val_loss: 0.4711
Epoch 4/10
14/14 - 3s - 182ms/step - accuracy: 0.5782 - loss: 0.7858 - val_accuracy: 0.9263 - val_loss: 0.4357
Epoch 5/10
14/14 - 2s - 178ms/step - accuracy: 0.6372 - loss: 0.7254 - val_accuracy: 0.9474 - val_loss: 0.3974
Epoch 6/10
14/14 - 3s - 183ms/step - accuracy: 0.6712 - loss: 0.6407 - val_accuracy: 0.9789 - val_loss: 0.3624
Epoch 7/10
14/14 - 2s - 149ms/step - accuracy: 0.7347 - loss: 0.5550 - val_accuracy: 0.9789 - val_loss: 0.3373
Epoch 8/10
14/14 - 2s - 128ms/step - accuracy: 0.7324 - loss: 0.5385 - val_accuracy: 0.9789 - val_loss: 0.3166
Epoch 9/10
14/14 - 3s - 183ms/step - accuracy: 0.7619 - loss: 0.4887 - val_accuracy: 0.9895 - val_loss: 0.2904
Epoch 10/10
14/14 - 2s - 153ms/step - accuracy: 0.7982 - loss: 0.4486 - val_accuracy: 0.9895 - val_loss: 0.2680

plt.plot(history_3.history['accuracy'])
plt.plot(history_3.history['val_accuracy'])
plt.title('Model Accuracy over Epochs')
plt.ylabel('Accuracy')
plt.xlabel('Epoch')
plt.legend(['Train', 'Validation'], loc='upper left')
plt.show()

print("Train performance metrics:")
cnn_model_3_train_perf = model_performance_classification(cnn_model_3, X_train_vgg, pd.Series(y_train))
display(cnn_model_3_train_perf)

plot_confusion_matrix(cnn_model_3, X_train_vgg, pd.Series(y_train))

print("\nValidation performance metrics:")
cnn_model_3_val_perf = model_performance_classification(cnn_model_3, X_val_vgg, pd.Series(y_val))
display(cnn_model_3_val_perf)

print("\n" + "="*60)
plot_confusion_matrix(cnn_model_3, X_val_vgg, pd.Series(y_val))

Train performance metrics:
14/14 ━━━━━━━━━━━━━━━━━━━━ 2s 140ms/step

14/14 ━━━━━━━━━━━━━━━━━━━━ 1s 103ms/step

Validation performance metrics:
3/3 ━━━━━━━━━━━━━━━━━━━━ 1s 241ms/step

============================================================
3/3 ━━━━━━━━━━━━━━━━━━━━ 0s 110ms/step

print("Train:", np.bincount(y_train))
print("Val:", np.bincount(y_val))
print("Test:", np.bincount(y_test))

Train: [224 217]
Val: [48 47]
Test: [48 47]

# For index 12
index = 12
plt.figure(figsize=(2, 2))
plt.imshow(X_val[index].reshape(X_val.shape[1], X_val.shape[2]), cmap='gray')  # grayscale view
plt.title(f"Image at index {index}")
plt.axis('off')
plt.show()

# Predict using the RGB-converted version
prediction = cnn_model_2.predict(X_val_vgg[index].reshape(1, X_val.shape[1], X_val.shape[2], 3))
predicted_label = 1 if prediction[0][0] > 0.5 else 0
print('Predicted Label:', predicted_label)
print('True Label:', y_val[index])

# For index 33
index = 33
plt.figure(figsize=(2, 2))
plt.imshow(X_val[index].reshape(X_val.shape[1], X_val.shape[2]), cmap='gray')  # grayscale view
plt.title(f"Image at index {index}")
plt.axis('off')
plt.show()

prediction = cnn_model_2.predict(X_val_vgg[index].reshape(1, X_val.shape[1], X_val.shape[2], 3))
predicted_label = 1 if prediction[0][0] > 0.5 else 0
print('Predicted Label:', predicted_label)
print('True Label:', y_val[index])

1/1 ━━━━━━━━━━━━━━━━━━━━ 0s 51ms/step
Predicted Label: 1
True Label: 1

1/1 ━━━━━━━━━━━━━━━━━━━━ 0s 51ms/step
Predicted Label: 0
True Label: 0

# Convert grayscale to RGB-like format for VGG (e.g., (128, 128, 1) → (128, 128, 3))
X_train_vgg = np.repeat(X_train, 3, axis=-1)
X_val_vgg = np.repeat(X_val, 3, axis=-1)
X_test_vgg = np.repeat(X_test, 3, axis=-1)

# Data augmentation only applied to training data
train_datagen = ImageDataGenerator(
    rotation_range=15,
    width_shift_range=0.1,
    height_shift_range=0.1,
    zoom_range=0.1,
    horizontal_flip=True,
    fill_mode='nearest'
)

# Validation/Test generators (no augmentation)
val_datagen = ImageDataGenerator()

# Flow from arrays
train_generator = train_datagen.flow(X_train_vgg, y_train, batch_size=32)
val_generator = val_datagen.flow(X_val_vgg, y_val, batch_size=32)

vgg_base = VGG16(weights='imagenet', include_top=False, input_shape=X_train_vgg.shape[1:])
for layer in vgg_base.layers:
    layer.trainable = False

x = vgg_base.output
x = Flatten()(x)
x = Dense(256, activation='relu')(x)
x = Dropout(0.7)(x)
x = Dense(128, activation='relu')(x)
x = Dropout(0.8)(x)
output = Dense(1, activation='sigmoid')(x)

cnn_model_4 = Model(inputs=vgg_base.input, outputs=output)

# Define the final model
cnn_model_4 = Model(inputs=vgg_base.input, outputs=output)

cnn_model_4.compile(
    optimizer=Adam(learning_rate=0.000001),  # small LR is safer with pre-trained weights
    loss='binary_crossentropy',
    metrics=['accuracy']
)

cnn_model_4.summary()

Model: "functional_4"

┏━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━┓
┃ Layer (type)                    ┃ Output Shape           ┃       Param # ┃
┡━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━┩
│ input_layer_3 (InputLayer)      │ (None, 200, 200, 3)    │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block1_conv1 (Conv2D)           │ (None, 200, 200, 64)   │         1,792 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block1_conv2 (Conv2D)           │ (None, 200, 200, 64)   │        36,928 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block1_pool (MaxPooling2D)      │ (None, 100, 100, 64)   │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block2_conv1 (Conv2D)           │ (None, 100, 100, 128)  │        73,856 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block2_conv2 (Conv2D)           │ (None, 100, 100, 128)  │       147,584 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block2_pool (MaxPooling2D)      │ (None, 50, 50, 128)    │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block3_conv1 (Conv2D)           │ (None, 50, 50, 256)    │       295,168 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block3_conv2 (Conv2D)           │ (None, 50, 50, 256)    │       590,080 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block3_conv3 (Conv2D)           │ (None, 50, 50, 256)    │       590,080 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block3_pool (MaxPooling2D)      │ (None, 25, 25, 256)    │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block4_conv1 (Conv2D)           │ (None, 25, 25, 512)    │     1,180,160 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block4_conv2 (Conv2D)           │ (None, 25, 25, 512)    │     2,359,808 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block4_conv3 (Conv2D)           │ (None, 25, 25, 512)    │     2,359,808 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block4_pool (MaxPooling2D)      │ (None, 12, 12, 512)    │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block5_conv1 (Conv2D)           │ (None, 12, 12, 512)    │     2,359,808 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block5_conv2 (Conv2D)           │ (None, 12, 12, 512)    │     2,359,808 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block5_conv3 (Conv2D)           │ (None, 12, 12, 512)    │     2,359,808 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ block5_pool (MaxPooling2D)      │ (None, 6, 6, 512)      │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ flatten_3 (Flatten)             │ (None, 18432)          │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ dense_7 (Dense)                 │ (None, 256)            │     4,718,848 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ dropout_4 (Dropout)             │ (None, 256)            │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ dense_8 (Dense)                 │ (None, 128)            │        32,896 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ dropout_5 (Dropout)             │ (None, 128)            │             0 │
├─────────────────────────────────┼────────────────────────┼───────────────┤
│ dense_9 (Dense)                 │ (None, 1)              │           129 │
└─────────────────────────────────┴────────────────────────┴───────────────┘

 Total params: 19,466,561 (74.26 MB)

 Trainable params: 4,751,873 (18.13 MB)

 Non-trainable params: 14,714,688 (56.13 MB)

history_4 = cnn_model_4.fit(
    train_generator,
    validation_data=val_generator,
    epochs=10,
    verbose=2
)

Epoch 1/10
14/14 - 11s - 774ms/step - accuracy: 0.4830 - loss: 1.4582 - val_accuracy: 0.5368 - val_loss: 0.7142
Epoch 2/10
14/14 - 4s - 301ms/step - accuracy: 0.5079 - loss: 1.4118 - val_accuracy: 0.5579 - val_loss: 0.7033
Epoch 3/10
14/14 - 6s - 395ms/step - accuracy: 0.4512 - loss: 1.4290 - val_accuracy: 0.6000 - val_loss: 0.6919
Epoch 4/10
14/14 - 4s - 302ms/step - accuracy: 0.5283 - loss: 1.2546 - val_accuracy: 0.6105 - val_loss: 0.6822
Epoch 5/10
14/14 - 5s - 334ms/step - accuracy: 0.4875 - loss: 1.4474 - val_accuracy: 0.6211 - val_loss: 0.6721
Epoch 6/10
14/14 - 5s - 357ms/step - accuracy: 0.4966 - loss: 1.2656 - val_accuracy: 0.6421 - val_loss: 0.6630
Epoch 7/10
14/14 - 4s - 308ms/step - accuracy: 0.5374 - loss: 1.3086 - val_accuracy: 0.6737 - val_loss: 0.6548
Epoch 8/10
14/14 - 5s - 387ms/step - accuracy: 0.5147 - loss: 1.2220 - val_accuracy: 0.6947 - val_loss: 0.6476
Epoch 9/10
14/14 - 9s - 646ms/step - accuracy: 0.5125 - loss: 1.1905 - val_accuracy: 0.7158 - val_loss: 0.6400
Epoch 10/10
14/14 - 5s - 392ms/step - accuracy: 0.5011 - loss: 1.2730 - val_accuracy: 0.7579 - val_loss: 0.6321

plt.plot(history_4.history['accuracy'])
plt.plot(history_4.history['val_accuracy'])
plt.title('Model Accuracy over Epochs')
plt.ylabel('Accuracy')
plt.xlabel('Epoch')
plt.legend(['Train', 'Validation'], loc='upper left')
plt.show()

# Predict on training and validation sets manually
train_preds = cnn_model_4.predict(X_train_vgg)
val_preds = cnn_model_4.predict(X_val_vgg)

# Convert probabilities to binary predictions
train_preds_bin = (train_preds > 0.5).astype(int)
val_preds_bin = (val_preds > 0.5).astype(int)

# Evaluate using  utility functions
print("Training performance:")
print(classification_report(y_train, train_preds_bin))

print("\nValidation performance:")
print(classification_report(y_val, val_preds_bin))

print("\nValidation Confusion Matrix:")
plot_confusion_matrix(cnn_model_4, X_val_vgg, pd.Series(y_val))

14/14 ━━━━━━━━━━━━━━━━━━━━ 2s 147ms/step
3/3 ━━━━━━━━━━━━━━━━━━━━ 1s 263ms/step
Training performance:
              precision    recall  f1-score   support

           0       0.66      0.97      0.79       224
           1       0.94      0.49      0.65       217

    accuracy                           0.73       441
   macro avg       0.80      0.73      0.72       441
weighted avg       0.80      0.73      0.72       441


Validation performance:
              precision    recall  f1-score   support

           0       0.69      0.96      0.80        48
           1       0.93      0.55      0.69        47

    accuracy                           0.76        95
   macro avg       0.81      0.76      0.75        95
weighted avg       0.81      0.76      0.75        95


Validation Confusion Matrix:
3/3 ━━━━━━━━━━━━━━━━━━━━ 0s 115ms/step

print("Train:", np.bincount(y_train))
print("Val:", np.bincount(y_val))
print("Test:", np.bincount(y_test))

Train: [224 217]
Val: [48 47]
Test: [48 47]

# For index 12
index = 12
plt.figure(figsize=(2, 2))
plt.imshow(X_val[index].reshape(X_val.shape[1], X_val.shape[2]), cmap='gray')  # grayscale view
plt.title(f"Image at index {index}")
plt.axis('off')
plt.show()

# Predict using the RGB-converted version
prediction = cnn_model_2.predict(X_val_vgg[index].reshape(1, X_val.shape[1], X_val.shape[2], 3))
predicted_label = 1 if prediction[0][0] > 0.5 else 0
print('Predicted Label:', predicted_label)
print('True Label:', y_val[index])

# For index 33
index = 33
plt.figure(figsize=(2, 2))
plt.imshow(X_val[index].reshape(X_val.shape[1], X_val.shape[2]), cmap='gray')  # grayscale view
plt.title(f"Image at index {index}")
plt.axis('off')
plt.show()

prediction = cnn_model_2.predict(X_val_vgg[index].reshape(1, X_val.shape[1], X_val.shape[2], 3))
predicted_label = 1 if prediction[0][0] > 0.5 else 0
print('Predicted Label:', predicted_label)
print('True Label:', y_val[index])

1/1 ━━━━━━━━━━━━━━━━━━━━ 0s 50ms/step
Predicted Label: 1
True Label: 1

1/1 ━━━━━━━━━━━━━━━━━━━━ 0s 50ms/step
Predicted Label: 0
True Label: 0

cnn_model_4_val_perf = pd.DataFrame({
    "Accuracy": [accuracy_score(y_val, val_preds_bin)],
    "Recall": [recall_score(y_val, val_preds_bin)],
    "Precision": [precision_score(y_val, val_preds_bin)],
    "F1 Score": [f1_score(y_val, val_preds_bin)]
})

# Create a summary DataFrame
comparison_df = pd.DataFrame({
    "Model": [
        "cnn_model_1 (Basic CNN)",
        "cnn_model_2 (VGG-16 Base)",
        "cnn_model_3 (VGG-16 + FFNN)",
        "cnn_model_4 (VGG-16 + FFNN + Aug)"
    ],
    "Accuracy": [
        cnn_model_1_val_perf["Accuracy"].values[0],
        cnn_model_2_val_perf["Accuracy"].values[0],
        cnn_model_3_val_perf["Accuracy"].values[0],
        cnn_model_4_val_perf["Accuracy"].values[0]
    ],
    "Precision": [
        cnn_model_1_val_perf["Precision"].values[0],
        cnn_model_2_val_perf["Precision"].values[0],
        cnn_model_3_val_perf["Precision"].values[0],
        cnn_model_4_val_perf["Precision"].values[0]
    ],
    "Recall": [
        cnn_model_1_val_perf["Recall"].values[0],
        cnn_model_2_val_perf["Recall"].values[0],
        cnn_model_3_val_perf["Recall"].values[0],
        cnn_model_4_val_perf["Recall"].values[0]
    ],
    "F1 Score": [
        cnn_model_1_val_perf["F1 Score"].values[0],
        cnn_model_2_val_perf["F1 Score"].values[0],
        cnn_model_3_val_perf["F1 Score"].values[0],
        cnn_model_4_val_perf["F1 Score"].values[0]
    ]
})

# Display the comparison
comparison_df.sort_values(by="Accuracy", ascending=False)

# Confirm test data shape for VGG-16
print(X_test_vgg.shape)  # should be (95, height, width, 3)

(95, 200, 200, 3)

print("Final Model (cnn_model_3) - Test Set Performance")
cnn_model_3_test_perf = model_performance_classification(cnn_model_3, X_test_vgg, pd.Series(y_test))
display(cnn_model_3_test_perf)

print("\n" + "=" * 60)
print("TEST CONFUSION MATRIX")
print("=" * 60 + "\n")

plot_confusion_matrix(cnn_model_3, X_test_vgg, pd.Series(y_test))

Final Model (cnn_model_3) - Test Set Performance
3/3 ━━━━━━━━━━━━━━━━━━━━ 1s 126ms/step

============================================================
TEST CONFUSION MATRIX
============================================================

3/3 ━━━━━━━━━━━━━━━━━━━━ 0s 107ms/step

# For grayscale input model
y_pred_probs = cnn_model_1.predict(X_val)
y_pred_labels = (y_pred_probs > 0.5).astype(int).reshape(-1)

# If your model uses RGB (e.g., VGG16-based)
# y_pred_probs = cnn_model_2.predict(X_val_vgg)
# y_pred_labels = (y_pred_probs > 0.5).astype(int).reshape(-1)

3/3 ━━━━━━━━━━━━━━━━━━━━ 0s 17ms/step

# Get true labels
y_true = y_val if isinstance(y_val, np.ndarray) else y_val.to_numpy()

# Find misclassified indexes
misclassified_idxs = np.where(y_pred_labels != y_true)[0]
print(f"Total misclassifications: {len(misclassified_idxs)}")

Total misclassifications: 2

# Show a few misclassified images
plt.figure(figsize=(12, 6))
for i, idx in enumerate(misclassified_idxs[:5]):
    plt.subplot(1, 5, i+1)
    image = X_val[idx].reshape(X_val.shape[1], X_val.shape[2])
    plt.imshow(image, cmap='gray')
    plt.title(f"Pred: {y_pred_labels[idx]}, True: {y_true[idx]}")
    plt.axis('off')
plt.tight_layout()
plt.show()

print("Classification Report:")
print(classification_report(y_true, y_pred_labels, target_names=["No Helmet", "Helmet"]))

print("\nConfusion Matrix:")
print(confusion_matrix(y_true, y_pred_labels))

Classification Report:
              precision    recall  f1-score   support

   No Helmet       0.98      0.98      0.98        48
      Helmet       0.98      0.98      0.98        47

    accuracy                           0.98        95
   macro avg       0.98      0.98      0.98        95
weighted avg       0.98      0.98      0.98        95


Confusion Matrix:
[[47  1]
 [ 1 46]]

error_data = pd.DataFrame({
    "Index": misclassified_idxs,
    "Predicted": y_pred_labels[misclassified_idxs],
    "Actual": y_true[misclassified_idxs],
    "Confidence": y_pred_probs[misclassified_idxs].reshape(-1)
})

display(error_data.head())

print("\n" + "=" * 60)
print("RUBRIC CHECKLIST")
print("=" * 60 + "\n")

============================================================
RUBRIC CHECKLIST
============================================================

print("\n" + "=" * 60)
print("RUBRIC CHECKLIST END")
print("=" * 60 + "\n")

============================================================
RUBRIC CHECKLIST END
============================================================

!jupyter nbconvert --to html "drive/MyDrive/Colab Notebooks/Project 6/HelmNet_Full_Code_Thomas_Hall.ipynb"

# List files in Directory Project 6
import os
os.listdir("drive/MyDrive/Colab Notebooks/Project 6")

['HelmNet_images_proj.npy',
 'HelmNet_Labels_proj.csv',
 'HelmNet_Low_Code-1.ipynb',
 'Introduction to Computer Vision-Project Presentation Template.pptx']

# Prompt for download.
from google.colab import files
files.download('drive/MyDrive/Colab Notebooks/Project 6/HelmNet_Full_Code_Thomas_Hall.html')

Dataset	Portion	Formula	Approx Count (from 631 total)
Train	70%	0.70 × 631 = \441	✅ `X_train.shape[0]` ≈ 441
Validation	15%	0.15 × 631 = \94–95	✅ `X_val.shape[0]` ≈ 95
Test	15%	0.15 × 631 = \94–95	✅ `X_test.shape[0]` ≈ 95

	Model	Accuracy	Precision	Recall	F1 Score
2	cnn_model_3 (VGG-16 + FFNN)	0.989474	0.989689	0.989474	0.989471
0	cnn_model_1 (Basic CNN)	0.978947	0.978947	0.978947	0.978947
1	cnn_model_2 (VGG-16 Base)	0.978947	0.979807	0.978947	0.978943
3	cnn_model_4 (VGG-16 + FFNN + Aug)	0.757895	0.928571	0.553191	0.693333

	Index	Predicted	Actual	Confidence
0	10	1	0	0.997965
1	55	0	1	0.103166

Executive Summary¶

Problem Statement¶

Business Context¶

Objective¶

Data Description¶

Installing and Importing the Necessary Libraries¶

Data Overview¶

Connect to Google Drive¶

Loading the image data and labels¶

Convert Labels to Numpy Array¶

Exploratory Data Analysis¶

Check for class imbalance¶

Plot 5 random images for each class and print their corresponding labels.¶

Data Preprocessing¶

Converting images to grayscale¶

Splitting the dataset 70/15/15 split for Train/Validation/Test¶

Final Ratios:¶

Data Normalization¶

Validate Normalization:¶

Model Building¶

Model Evaluation Criterion¶

Utility Functions¶

model_performance_classification(...)¶

Purpose:¶

plot_confusion_matrix(...)¶

Purpose:¶

Model 1: Simple Convolutional Neural Network (CNN)¶

Model 1: Train the Model¶

Vizualizing the predictions¶

Model 2: (VGG-16 (Base))¶

Load VGG16 without the top classifier¶

Add Custom Classification Head¶

Compile the Model¶

Train the Model¶

Evaluate on Train & Validation Only¶

Print class distributions to ensure my data is still balanced due to high scores.¶

Vizualizing the predictions¶

Model 3: (VGG-16 (Base + FFNN))¶

Load VGG16 without the top classifier¶

Add a Deeper FFNN Head¶

Compile the Model¶

Train the Model¶

Evaluate on Train & Validation Only (NOT test yet!)¶

Print class distributions to ensure my data is still balanced due to high scores.¶

Vizualizing the predictions¶

Model 4: (VGG-16 (Base + FFNN + Data Augmentation)¶

Define ImageDataGenerator for Augmentation¶

Load VGG16 without the top classifier (reuse from cnn_model_3)¶

Compile the Model¶

Train the Model¶

Evaluate on Train & Validation Only (NOT test yet!)¶

Print class distributions to ensure my data is still balanced due to high scores.¶

Vizualizing the predictions¶

Model Performance Comparison and Final Model Selection¶

Create a Comparison Table¶

Test Performance¶

Prepare Test Data¶

Evaluate on Test Set¶

Interpret the Results¶

Perform Error Analysis¶

Actionable Insights & Recommendations¶

✅ Rubric Checklist¶

Convert Notebook to HTML using NbConvert¶