from keras import datasets
# Load CIFAR-10; load_data() yields a (train, test) pair of (images, labels) tuples.
train_split, test_split = datasets.cifar10.load_data()
X_train, y_train = train_split
X_test, y_test = test_split

# Report the array shapes of each split.
print('Training data:', f'\tX_train: {X_train.shape}, y_train {y_train.shape}', sep='\n')
print('Test data:', f'\tX_test: {X_test.shape}, y_test {y_test.shape}', sep='\n')

Downloading data from https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz
170498071/170498071 ━━━━━━━━━━━━━━━━━━━━ 4s 0us/step
Training data:
	X_train: (50000, 32, 32, 3), y_train (50000, 1)
Test data:
	X_test: (10000, 32, 32, 3), y_test (10000, 1)

import pandas as pd

# Human-readable class names; a name's position in the list is its integer label.
classes = [
    'airplane',
    'automobile',
    'bird',
    'cat',
    'deer',
    'dog',
    'frog',
    'horse',
    'ship',
    'truck',
]
# Label-id -> name lookup table (shown as the cell's output in a notebook).
pd.DataFrame(list(enumerate(classes)), columns=['Class', 'Name'])

import numpy as np
import matplotlib.pyplot as plt

def displayImage(images, labels, nCols=10):
    """Display images in a grid, each captioned with its label.

    Args:
        images: Indexable collection of images; ``images[i]`` is passed to
            ``plt.imshow`` and is paired with ``labels[i]``.
        labels: Sized collection of captions; its length decides how many
            images are drawn.
        nCols: Number of images per grid row.

    Returns:
        None. When ``labels`` is empty nothing is drawn.
    """
    nImages = len(labels)
    if nImages == 0:
        # An empty grid would need a zero-height figure; skip plotting entirely.
        return

    nRows = -(-nImages // nCols)  # integer ceiling division
    plt.figure(figsize=(2 * nCols, 2 * nRows))  # 2x2 inches per cell
    for i, label in enumerate(labels):
        plt.subplot(nRows, nCols, i + 1)
        # Hide axis ticks and the grid so only the picture and caption remain.
        plt.xticks([])
        plt.yticks([])
        plt.grid(False)
        plt.imshow(images[i])
        plt.xlabel(str(label), fontsize=10)
    plt.show()

k = 10  # samples taken per class; also used as the number of grid columns

# Row indices of the first k training samples of each class, grouped class by class.
first_ten_indices_per_class = [
    sample_idx
    for class_label in range(10)
    for sample_idx in np.where(y_train == class_label)[0][:k]
]

# Gather the selected images and translate their integer labels into names.
images = X_train[first_ten_indices_per_class]
labels = [classes[label_id] for label_id in y_train[first_ten_indices_per_class].ravel()]

SHOW_IMAGES = True  # set to False to skip drawing the sample grid
if SHOW_IMAGES:
    displayImage(images, labels, nCols=k)

# import necessary libraries
import keras
from keras import layers, models, optimizers

# Build the CNN: three convolutional blocks followed by a dense classifier head.
model = models.Sequential()

# Input layer matching the shape of a single training image
model.add(keras.Input(shape=X_train.shape[1:]))

# One (filters, dropout rate) entry per conv block. Every block is
# [Conv2D -> BatchNorm] x 2, then 2x2 max-pooling and dropout.
conv_blocks = [(32, 0.2), (64, 0.3), (128, 0.4)]
conv_index = 0  # running counter so the conv layers are named Conv1..Conv6
for filters, drop_rate in conv_blocks:
    for _ in range(2):
        conv_index += 1
        model.add(layers.Conv2D(
            filters,
            (3, 3),
            # `negative_slope` replaces the deprecated `alpha` argument, which
            # makes Keras emit a UserWarning for every LeakyReLU created.
            activation=layers.LeakyReLU(negative_slope=0.1),
            padding='same',
            name=f"Conv{conv_index}",
        ))
        model.add(layers.BatchNormalization())
    model.add(layers.MaxPooling2D((2, 2)))
    model.add(layers.Dropout(drop_rate))

# Flatten the feature maps to feed into the dense layer
model.add(layers.Flatten())

# Dense (fully connected) layer
model.add(layers.Dense(512, activation=layers.LeakyReLU(negative_slope=0.1), name="Dense"))
model.add(layers.BatchNormalization())
model.add(layers.Dropout(0.4))

# Output layer with softmax over the 10 classes
model.add(layers.Dense(10, activation='softmax', name="output"))

# Compile with Adam; categorical cross-entropy expects one-hot encoded labels
opt = optimizers.Adam(learning_rate=0.001)
model.compile(optimizer=opt, loss='categorical_crossentropy', metrics=['accuracy'])

# Display model summary. summary() prints the table itself and returns None,
# so wrapping it in print() only appended a stray "None" line.
model.summary()

/usr/local/lib/python3.11/dist-packages/keras/src/layers/activations/leaky_relu.py:41: UserWarning: Argument `alpha` is deprecated. Use `negative_slope` instead.
  warnings.warn(

Model: "sequential"

┏━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━┓
┃ Layer (type)                         ┃ Output Shape                ┃         Param # ┃
┡━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━┩
│ Conv1 (Conv2D)                       │ (None, 32, 32, 32)          │             896 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ batch_normalization                  │ (None, 32, 32, 32)          │             128 │
│ (BatchNormalization)                 │                             │                 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ Conv2 (Conv2D)                       │ (None, 32, 32, 32)          │           9,248 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ batch_normalization_1                │ (None, 32, 32, 32)          │             128 │
│ (BatchNormalization)                 │                             │                 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ max_pooling2d (MaxPooling2D)         │ (None, 16, 16, 32)          │               0 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ dropout (Dropout)                    │ (None, 16, 16, 32)          │               0 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ Conv3 (Conv2D)                       │ (None, 16, 16, 64)          │          18,496 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ batch_normalization_2                │ (None, 16, 16, 64)          │             256 │
│ (BatchNormalization)                 │                             │                 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ Conv4 (Conv2D)                       │ (None, 16, 16, 64)          │          36,928 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ batch_normalization_3                │ (None, 16, 16, 64)          │             256 │
│ (BatchNormalization)                 │                             │                 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ max_pooling2d_1 (MaxPooling2D)       │ (None, 8, 8, 64)            │               0 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ dropout_1 (Dropout)                  │ (None, 8, 8, 64)            │               0 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ Conv5 (Conv2D)                       │ (None, 8, 8, 128)           │          73,856 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ batch_normalization_4                │ (None, 8, 8, 128)           │             512 │
│ (BatchNormalization)                 │                             │                 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ Conv6 (Conv2D)                       │ (None, 8, 8, 128)           │         147,584 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ batch_normalization_5                │ (None, 8, 8, 128)           │             512 │
│ (BatchNormalization)                 │                             │                 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ max_pooling2d_2 (MaxPooling2D)       │ (None, 4, 4, 128)           │               0 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ dropout_2 (Dropout)                  │ (None, 4, 4, 128)           │               0 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ flatten (Flatten)                    │ (None, 2048)                │               0 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ Dense (Dense)                        │ (None, 512)                 │       1,049,088 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ batch_normalization_6                │ (None, 512)                 │           2,048 │
│ (BatchNormalization)                 │                             │                 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ dropout_3 (Dropout)                  │ (None, 512)                 │               0 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ output (Dense)                       │ (None, 10)                  │           5,130 │
└──────────────────────────────────────┴─────────────────────────────┴─────────────────┘

 Total params: 1,345,066 (5.13 MB)

 Trainable params: 1,343,146 (5.12 MB)

 Non-trainable params: 1,920 (7.50 KB)

None

# Import the one-hot encoding utility from the same standalone `keras` package
# the rest of this file uses (instead of going through `tensorflow.keras`).
from keras.utils import to_categorical

epochs = 40           # number of training epochs
batch_size = 128      # batch size for training

# Train the model
history = model.fit(
    X_train / 255.0,                          # scale pixel values by 1/255
    # One-hot encode labels; num_classes is pinned to the width of the model's
    # 10-unit output layer rather than inferred from the largest label present.
    to_categorical(y_train, num_classes=10),
    epochs=epochs,
    batch_size=batch_size,
    validation_split=0.1                      # hold out 10% of the training data for validation
)

Epoch 1/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 28s 42ms/step - accuracy: 0.3643 - loss: 2.0671 - val_accuracy: 0.2438 - val_loss: 2.2031
Epoch 2/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 5s 14ms/step - accuracy: 0.5920 - loss: 1.1562 - val_accuracy: 0.6798 - val_loss: 0.9196
Epoch 3/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 5s 14ms/step - accuracy: 0.6788 - loss: 0.9096 - val_accuracy: 0.7252 - val_loss: 0.7947
Epoch 4/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 5s 14ms/step - accuracy: 0.7231 - loss: 0.7892 - val_accuracy: 0.7478 - val_loss: 0.7366
Epoch 5/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 10s 14ms/step - accuracy: 0.7480 - loss: 0.7146 - val_accuracy: 0.7722 - val_loss: 0.6664
Epoch 6/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 5s 14ms/step - accuracy: 0.7729 - loss: 0.6443 - val_accuracy: 0.7906 - val_loss: 0.6168
Epoch 7/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 5s 14ms/step - accuracy: 0.7867 - loss: 0.6058 - val_accuracy: 0.7760 - val_loss: 0.6534
Epoch 8/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 5s 15ms/step - accuracy: 0.8041 - loss: 0.5569 - val_accuracy: 0.8084 - val_loss: 0.5519
Epoch 9/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 5s 14ms/step - accuracy: 0.8187 - loss: 0.5194 - val_accuracy: 0.7756 - val_loss: 0.6638
Epoch 10/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 5s 15ms/step - accuracy: 0.8276 - loss: 0.4866 - val_accuracy: 0.7986 - val_loss: 0.6157
Epoch 11/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 10s 15ms/step - accuracy: 0.8365 - loss: 0.4633 - val_accuracy: 0.8254 - val_loss: 0.5134
Epoch 12/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 5s 14ms/step - accuracy: 0.8479 - loss: 0.4372 - val_accuracy: 0.8242 - val_loss: 0.5171
Epoch 13/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 5s 15ms/step - accuracy: 0.8516 - loss: 0.4150 - val_accuracy: 0.8328 - val_loss: 0.4937
Epoch 14/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 5s 15ms/step - accuracy: 0.8639 - loss: 0.3913 - val_accuracy: 0.8426 - val_loss: 0.4729
Epoch 15/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 10s 15ms/step - accuracy: 0.8696 - loss: 0.3671 - val_accuracy: 0.8378 - val_loss: 0.4963
Epoch 16/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 10s 15ms/step - accuracy: 0.8725 - loss: 0.3576 - val_accuracy: 0.8368 - val_loss: 0.5001
Epoch 17/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 11s 16ms/step - accuracy: 0.8756 - loss: 0.3448 - val_accuracy: 0.8498 - val_loss: 0.4708
Epoch 18/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 10s 15ms/step - accuracy: 0.8857 - loss: 0.3283 - val_accuracy: 0.8460 - val_loss: 0.4725
Epoch 19/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 5s 15ms/step - accuracy: 0.8870 - loss: 0.3193 - val_accuracy: 0.8484 - val_loss: 0.4735
Epoch 20/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 10s 15ms/step - accuracy: 0.8879 - loss: 0.3110 - val_accuracy: 0.8424 - val_loss: 0.4934
Epoch 21/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 5s 15ms/step - accuracy: 0.8939 - loss: 0.2949 - val_accuracy: 0.8504 - val_loss: 0.4926
Epoch 22/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 5s 14ms/step - accuracy: 0.8993 - loss: 0.2830 - val_accuracy: 0.8534 - val_loss: 0.4761
Epoch 23/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 5s 15ms/step - accuracy: 0.8995 - loss: 0.2797 - val_accuracy: 0.8450 - val_loss: 0.4954
Epoch 24/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 5s 14ms/step - accuracy: 0.9030 - loss: 0.2683 - val_accuracy: 0.8462 - val_loss: 0.5062
Epoch 25/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 5s 15ms/step - accuracy: 0.9105 - loss: 0.2521 - val_accuracy: 0.8618 - val_loss: 0.4506
Epoch 26/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 5s 15ms/step - accuracy: 0.9088 - loss: 0.2527 - val_accuracy: 0.8636 - val_loss: 0.4389
Epoch 27/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 10s 15ms/step - accuracy: 0.9119 - loss: 0.2433 - val_accuracy: 0.8658 - val_loss: 0.4509
Epoch 28/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 10s 15ms/step - accuracy: 0.9127 - loss: 0.2426 - val_accuracy: 0.8540 - val_loss: 0.5006
Epoch 29/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 10s 15ms/step - accuracy: 0.9188 - loss: 0.2273 - val_accuracy: 0.8580 - val_loss: 0.4780
Epoch 30/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 5s 15ms/step - accuracy: 0.9191 - loss: 0.2233 - val_accuracy: 0.8464 - val_loss: 0.5104
Epoch 31/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 5s 15ms/step - accuracy: 0.9184 - loss: 0.2284 - val_accuracy: 0.8560 - val_loss: 0.4549
Epoch 32/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 5s 14ms/step - accuracy: 0.9214 - loss: 0.2198 - val_accuracy: 0.8554 - val_loss: 0.4984
Epoch 33/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 5s 14ms/step - accuracy: 0.9234 - loss: 0.2098 - val_accuracy: 0.8568 - val_loss: 0.4962
Epoch 34/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 5s 15ms/step - accuracy: 0.9300 - loss: 0.1986 - val_accuracy: 0.8524 - val_loss: 0.5249
Epoch 35/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 5s 14ms/step - accuracy: 0.9291 - loss: 0.1979 - val_accuracy: 0.8640 - val_loss: 0.4394
Epoch 36/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 5s 15ms/step - accuracy: 0.9271 - loss: 0.2011 - val_accuracy: 0.8542 - val_loss: 0.5147
Epoch 37/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 10s 15ms/step - accuracy: 0.9329 - loss: 0.1883 - val_accuracy: 0.8688 - val_loss: 0.4523
Epoch 38/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 5s 14ms/step - accuracy: 0.9323 - loss: 0.1849 - val_accuracy: 0.8686 - val_loss: 0.4619
Epoch 39/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 5s 14ms/step - accuracy: 0.9337 - loss: 0.1844 - val_accuracy: 0.8468 - val_loss: 0.5449
Epoch 40/40
352/352 ━━━━━━━━━━━━━━━━━━━━ 5s 15ms/step - accuracy: 0.9302 - loss: 0.1912 - val_accuracy: 0.8636 - val_loss: 0.4712

# Extract the per-epoch curves recorded in the training history
acc = history.history['accuracy']
val_acc = history.history['val_accuracy']
loss = history.history['loss']
val_loss = history.history['val_loss']

# 1-based epoch numbers for the x-axis. Stored under its own name so the
# `epochs` hyperparameter passed to model.fit is not overwritten with a range
# (which would break re-running the training cell afterwards).
epoch_numbers = range(1, len(acc) + 1)

# One figure per metric: training curve vs. validation curve
for metric_name, train_curve, val_curve, legend_loc in (
    ('Accuracy', acc, val_acc, 'lower right'),
    ('Loss', loss, val_loss, 'upper right'),
):
    plt.figure(figsize=(10, 6))
    plt.plot(epoch_numbers, train_curve, label=f'Training {metric_name}')
    plt.plot(epoch_numbers, val_curve, label=f'Validation {metric_name}')
    plt.title(f'Training vs. Validation {metric_name}')
    plt.xlabel('Epoch')
    plt.ylabel(metric_name)
    plt.legend(loc=legend_loc)
    plt.grid(True)
    plt.show()

# In this cell type in your code to evaluate your model on the test samples.
# Display your classification report with metrics rounded to 4 decimal places.


from sklearn.metrics import classification_report

# Predicted class probabilities for the test images (pixels scaled by 1/255)
y_pred_probs = model.predict(X_test / 255.0)
# Predicted class = column index of the largest softmax output in each row
y_pred = np.argmax(y_pred_probs, axis=1)

# Build the per-class report with 4 decimal places, then print it under a heading
report = classification_report(y_test, y_pred, target_names=classes, digits=4)
print("Classification Report (rounded to 4 decimal places):\n")
print(report)

313/313 ━━━━━━━━━━━━━━━━━━━━ 1s 3ms/step
Classification Report (rounded to 4 decimal places):

              precision    recall  f1-score   support

    airplane     0.8480    0.8760    0.8618      1000
  automobile     0.9025    0.9530    0.9270      1000
        bird     0.7548    0.8650    0.8062      1000
         cat     0.7676    0.7100    0.7377      1000
        deer     0.8815    0.8330    0.8566      1000
         dog     0.8280    0.7560    0.7904      1000
        frog     0.8716    0.9230    0.8966      1000
       horse     0.9479    0.8370    0.8890      1000
        ship     0.9314    0.8960    0.9134      1000
       truck     0.8673    0.9350    0.8999      1000

    accuracy                         0.8584     10000
   macro avg     0.8601    0.8584    0.8578     10000
weighted avg     0.8601    0.8584    0.8578     10000

# In this cell type in your code and run it to display the first 20 misclassified images
# For each misclassified image show (y_true, y_pred, prob),

# Probability the model assigned to its predicted (highest-scoring) class
pred_probs = np.max(y_pred_probs, axis=1)

# Flatten true labels to 1-D so they compare element-wise with y_pred
y_true = y_test.flatten()

# Indices of test samples whose predicted class differs from the true class
misclassified_indices = np.where(y_pred != y_true)[0]

# Show the first `num_to_show` misclassified examples. The grid is derived
# from num_to_show so changing it cannot overflow a hard-coded 4x5 layout.
num_to_show = 20
n_cols = 5
n_rows = -(-num_to_show // n_cols)  # integer ceiling division
plt.figure(figsize=(3 * n_cols, 2.5 * n_rows))  # 15x10 inches for the default 4x5 grid

for i, idx in enumerate(misclassified_indices[:num_to_show]):
    plt.subplot(n_rows, n_cols, i + 1)
    plt.imshow(X_test[idx])
    plt.title(f"True: {classes[y_true[idx]]}\nPred: {classes[y_pred[idx]]}\nProb: {pred_probs[idx]:.4f}")
    plt.axis('off')

plt.tight_layout()
plt.show()

Model	Description	Outcome	Reason for Rejection
Basic CNN (3 conv layers)	Used ReLU, smaller structure	~76% val accuracy	Underperformed
Deeper CNN (5 conv layers, ReLU)	Same structure but deeper	Peaked at ~83.6% val accuracy	Plateaued before 85%
Same model with SGD optimizer	Swapped Adam with SGD+momentum	Slower convergence, less stable	Lower final accuracy
Same model with EarlyStopping	Tried to cut overfitting early	Trained shorter but didn’t improve	Stopped before hitting 85%
Augmented model	Used `ImageDataGenerator` (flip, shift, rotate)	Slight improvements, but unstable and slow	Caused compatibility or memory issues
Very deep model (6 conv layers + pooling)	LeakyReLU, Dropout, SGD	Took over 2 hours per epoch, stopped after 2	Impractical to run
Normalization (X_train / 255.0)	Tested normalized pixel values	Didn’t improve enough to justify changes	Not rejected — the final training and evaluation code does scale inputs with `/ 255.0`

Steven Lora - MSIT 675 Project 1 - Convolutional Neural Networks¶

Get CIFAR 10 dataset¶

Create Model [15 Points]¶

Model Compilation¶

Train model [5 Points]¶

Model Training¶

Final Model Summary¶

Other Models Tried (and Why They Were Rejected)¶

Why We Chose the Final Model¶

Check for over-fitting [5 Points]¶

Evaluate trained model [5 Points]¶

Model Evaluation¶

Display misclassified images [5 Points]¶

Conclusion¶

Final Notes¶

	Class	Name
0	0	airplane
1	1	automobile
2	2	bird
3	3	cat
4	4	deer
5	5	dog
6	6	frog
7	7	horse
8	8	ship
9	9	truck