Convolutional Neural Networks (CNNs) - Summary¶
CNNs are a type of deep learning model designed for processing spatial data, mainly images. They use convolutional layers to detect patterns like edges, textures, and shapes in images. Unlike traditional dense networks, CNNs reduce the number of parameters by sharing weights across spatially related pixels, making them highly efficient for tasks like image classification, object detection, and segmentation.
CNN Properties
- Feature Extraction - CNNs automatically detect patterns in images at different levels.
Example: Early layers detect edges (straight lines, curves), mid layers detect textures (fur, waves), and deep layers detect objects (eyes, faces, cars). There is no need to manually define features; CNNs learn them automatically.
- Spatial Hierarchy (Pooling Layers) - Pooling reduces image size while keeping key features.
Example: A 2x2 Max Pooling picks the largest value in each 2x2 region, so a 32x32 image becomes 16x16 while keeping the strongest features. This speeds up training and helps prevent overfitting.
- Parameter Efficiency (Kernels/Filters) - Instead of assigning a weight to every pixel, CNNs use small filters (kernels) to detect patterns across the image (see the sketch after this list).
Example: A 3x3 filter scans the image and shares its weights, unlike dense layers where each pixel has separate weights. Fewer parameters → faster training & better generalization.
- Translation Invariance - CNNs recognize objects even if they shift position.
Example: A CNN trained to detect a cat in the center can still recognize it if it appears in the corner. This makes CNNs robust to changes in object location.
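To make the parameter-efficiency point concrete, here is a minimal sketch (added for illustration, not part of the original notebook) comparing the parameter count of a small Conv2D layer with a Dense layer applied to the same 28x28 grayscale input:
import tensorflow as tf
# Parameter count of a 3x3 convolution with 64 filters on a 28x28x1 input ...
conv_model = tf.keras.Sequential([
    tf.keras.Input(shape=(28, 28, 1)),
    tf.keras.layers.Conv2D(64, (3, 3), activation='relu')   # 64 * (3*3*1 + 1) = 640 parameters
])
# ... versus a dense layer with the same number of units on the flattened image.
dense_model = tf.keras.Sequential([
    tf.keras.Input(shape=(28, 28, 1)),
    tf.keras.layers.Flatten(),
    tf.keras.layers.Dense(64, activation='relu')             # (28*28 + 1) * 64 = 50,240 parameters
])
print(conv_model.count_params())   # 640
print(dense_model.count_params())  # 50240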
How Do CNNs Enhance Certain Features?
CNNs enhance certain features through a combination of convolutional layers, activation functions, and pooling operations. When an image passes through the convolutional layers, small filters (kernels) scan the image and detect essential patterns like edges, textures, and shapes. Early layers capture simple features like edges, while deeper layers identify complex structures such as facial features or objects. The activation function, typically ReLU, helps by keeping only the important positive values, suppressing weaker signals, and introducing non-linearity to make the model more powerful. Pooling layers, such as max pooling, further enhance feature selection by downsampling the image, preserving the most critical information while reducing unnecessary noise and computational load. By stacking multiple convolutional and pooling layers, CNNs gradually refine and emphasize the most relevant features in an image.
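As a small illustration (a hedged sketch, not code from the original notebook), the snippet below applies a hand-made 3x3 vertical-edge kernel and ReLU to a tiny synthetic image; the kernel values are chosen purely for demonstration:
import numpy as np
import tensorflow as tf
# Tiny 6x6 "image" with a bright vertical stripe in the middle.
image = np.zeros((1, 6, 6, 1), dtype=np.float32)
image[0, :, 2:4, 0] = 1.0
# Hand-made vertical-edge kernel (illustrative, not learned).
edge_kernel = np.array([[-1., 0., 1.],
                        [-1., 0., 1.],
                        [-1., 0., 1.]], dtype=np.float32).reshape(3, 3, 1, 1)
# The convolution responds strongly at the stripe's edges ...
conv = tf.nn.conv2d(image, edge_kernel, strides=1, padding='VALID')
# ... and ReLU keeps only the positive responses (where brightness increases left to right),
# suppressing the rest. Learned CNN filters behave analogously.
print(tf.nn.relu(conv)[0, :, :, 0].numpy())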
Why Use Dense Layers with CNN?
Dense layers are integrated with CNNs to process and classify the extracted features. After the final convolutional and pooling layers, the multi-dimensional feature maps are flattened into a one-dimensional vector so that they can be passed into fully connected (dense) layers. These layers combine and interpret the extracted features, allowing the model to learn relationships between them. The final dense layer usually contains neurons equal to the number of output classes, using an activation function like softmax for multi-class classification. Essentially, while CNN layers focus on feature extraction, dense layers help in decision-making and classification based on the extracted patterns. Together, CNNs and dense layers create a powerful model capable of recognizing and categorizing images efficiently. So the information flowing into the dense layers is more focused and more accurate.
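A minimal sketch (assuming the 5x5x64 feature-map shape that the model built later in this notebook produces) of how Flatten bridges the convolutional part and the dense classification head:
import tensorflow as tf
# Illustrative classification head: 5x5x64 feature maps are flattened into a
# 1,600-element vector, passed through a dense layer, and mapped to 10 class
# probabilities by the softmax output layer.
head = tf.keras.Sequential([
    tf.keras.Input(shape=(5, 5, 64)),
    tf.keras.layers.Flatten(),                       # (5, 5, 64) -> 1600 values
    tf.keras.layers.Dense(128, activation='relu'),
    tf.keras.layers.Dense(10, activation='softmax')  # one probability per class
])
print(head.output_shape)  # (None, 10)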
Code¶
import tensorflow as tf
import matplotlib.pyplot as plt
# Loading Fashion MNIST dataset
fashion_mnist = tf.keras.datasets.fashion_mnist
(training_images, training_labels), (testing_images, testing_labels) = fashion_mnist.load_data()
# Normalizing the images
training_images=training_images/255.0
testing_images = testing_images/255.0
Now we will build the model, but this time we will use convolutional layers in the architecture. First, we define a callback to stop training once accuracy reaches 98% -
class callback(tf.keras.callbacks.Callback):
    def on_epoch_end(self, epoch, logs = {}):
        if logs['accuracy'] >= 0.98:
            print('Reached 98%. Stopping the training')
            self.model.stop_training = True
Let's understand Pooling a bit
Pooling is used after convolutional layers to reduce the spatial dimensions of feature maps while retaining the most important information. It helps in downsampling, reducing computations, and preventing overfitting. The most common type is Max Pooling, which selects the highest value from a small region (e.g., 2×2 window), preserving strong features. Average Pooling takes the average of values, smoothing the feature map. Pooling enhances feature extraction by making CNNs more robust to small shifts or distortions in the image. By reducing unnecessary details, pooling layers allow deeper layers to focus on high-level patterns for better classification performance.
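As a quick illustration (a minimal sketch, not part of the original notebook), here is 2x2 max pooling applied to a small 4x4 array:
import numpy as np
import tensorflow as tf
# Max pooling with a 2x2 window and stride 2 keeps only the largest value
# in each non-overlapping 2x2 block, halving both spatial dimensions.
feature_map = np.array([[1., 3., 2., 1.],
                        [4., 6., 5., 2.],
                        [7., 2., 1., 0.],
                        [3., 8., 9., 4.]], dtype=np.float32).reshape(1, 4, 4, 1)
pooled = tf.keras.layers.MaxPool2D(pool_size=(2, 2))(feature_map)
print(pooled[0, :, :, 0].numpy())
# [[6. 5.]
#  [8. 9.]]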
model = tf.keras.models.Sequential([
    tf.keras.Input(shape=(28,28,1)), # Input will come first
    tf.keras.layers.Conv2D(64, (3,3), activation='relu'), # First convolution layer. Explained below
    tf.keras.layers.MaxPool2D(2,2), # First maxpooling layer. Explained below
    tf.keras.layers.Conv2D(64, (3,3), activation='relu'), # Second convolution layer
    tf.keras.layers.MaxPool2D(2,2), # Second maxpooling layer
    tf.keras.layers.Flatten(), # Flatten layer
    tf.keras.layers.Dense(128, activation='relu'), # First dense layer
    tf.keras.layers.Dense(10, activation='softmax') # Output layer
])
model.summary()
Model: "sequential"
┏━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━┓
┃ Layer (type)                    ┃ Output Shape           ┃   Param # ┃
┡━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━┩
│ conv2d (Conv2D)                 │ (None, 26, 26, 64)     │       640 │
├─────────────────────────────────┼────────────────────────┼───────────┤
│ max_pooling2d (MaxPooling2D)    │ (None, 13, 13, 64)     │         0 │
├─────────────────────────────────┼────────────────────────┼───────────┤
│ conv2d_1 (Conv2D)               │ (None, 11, 11, 64)     │    36,928 │
├─────────────────────────────────┼────────────────────────┼───────────┤
│ max_pooling2d_1 (MaxPooling2D)  │ (None, 5, 5, 64)       │         0 │
├─────────────────────────────────┼────────────────────────┼───────────┤
│ flatten (Flatten)               │ (None, 1600)           │         0 │
├─────────────────────────────────┼────────────────────────┼───────────┤
│ dense (Dense)                   │ (None, 128)            │   204,928 │
├─────────────────────────────────┼────────────────────────┼───────────┤
│ dense_1 (Dense)                 │ (None, 10)             │     1,290 │
└─────────────────────────────────┴────────────────────────┴───────────┘
Total params: 243,786 (952.29 KB)
Trainable params: 243,786 (952.29 KB)
Non-trainable params: 0 (0.00 B)
This CNN model is designed for image classification -
- Input Layer: Accepts grayscale images of size (28,28,1).
- First Conv Layer: Applies 64 filters of size (3x3) with ReLU activation to detect patterns.
- MaxPooling (2x2): Reduces feature map size, keeping important details.
- Second Conv + MaxPooling: Further extracts deeper features.
- Flatten: Converts 2D feature maps into a 1D vector for the dense layers.
- Dense (128 neurons, ReLU): Fully connected layer for feature learning.
- Output (10 neurons, Softmax): Predicts class probabilities for the 10 Fashion MNIST clothing categories.
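The output shapes and parameter counts in the summary above follow directly from these definitions; here is a quick sanity check of the numbers (added for illustration):
# Conv2D with default 'valid' padding: output size = input - kernel + 1,
# parameters = filters * (kernel_height * kernel_width * input_channels + 1)
conv1_out = 28 - 3 + 1                  # 26
conv1_params = 64 * (3 * 3 * 1 + 1)     # 640
pool1_out = conv1_out // 2              # 13 (2x2 max pooling halves each dimension)
conv2_out = pool1_out - 3 + 1           # 11
conv2_params = 64 * (3 * 3 * 64 + 1)    # 36,928
pool2_out = conv2_out // 2              # 5
flat_size = pool2_out * pool2_out * 64  # 1,600
dense1_params = (flat_size + 1) * 128   # 204,928
output_params = (128 + 1) * 10          # 1,290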
model.compile(optimizer='adam', loss=tf.keras.losses.SparseCategoricalCrossentropy(), metrics = ['accuracy'])
model.fit(training_images, training_labels, epochs = 30, callbacks=[callback()])
Epoch 1/30
1875/1875 ━━━━━━━━━━━━━━━━━━━━ 9s 4ms/step - accuracy: 0.7852 - loss: 0.5989
Epoch 2/30
1875/1875 ━━━━━━━━━━━━━━━━━━━━ 7s 4ms/step - accuracy: 0.8865 - loss: 0.3069
Epoch 3/30
1875/1875 ━━━━━━━━━━━━━━━━━━━━ 8s 4ms/step - accuracy: 0.9052 - loss: 0.2546
Epoch 4/30
1875/1875 ━━━━━━━━━━━━━━━━━━━━ 8s 4ms/step - accuracy: 0.9191 - loss: 0.2157
Epoch 5/30
1875/1875 ━━━━━━━━━━━━━━━━━━━━ 8s 4ms/step - accuracy: 0.9297 - loss: 0.1880
Epoch 6/30
1875/1875 ━━━━━━━━━━━━━━━━━━━━ 8s 4ms/step - accuracy: 0.9392 - loss: 0.1617
Epoch 7/30
1875/1875 ━━━━━━━━━━━━━━━━━━━━ 8s 4ms/step - accuracy: 0.9465 - loss: 0.1442
Epoch 8/30
1875/1875 ━━━━━━━━━━━━━━━━━━━━ 8s 4ms/step - accuracy: 0.9522 - loss: 0.1276
Epoch 9/30
1875/1875 ━━━━━━━━━━━━━━━━━━━━ 8s 4ms/step - accuracy: 0.9590 - loss: 0.1088
Epoch 10/30
1875/1875 ━━━━━━━━━━━━━━━━━━━━ 8s 4ms/step - accuracy: 0.9640 - loss: 0.0960
Epoch 11/30
1875/1875 ━━━━━━━━━━━━━━━━━━━━ 8s 4ms/step - accuracy: 0.9671 - loss: 0.0856
Epoch 12/30
1875/1875 ━━━━━━━━━━━━━━━━━━━━ 8s 4ms/step - accuracy: 0.9704 - loss: 0.0764
Epoch 13/30
1875/1875 ━━━━━━━━━━━━━━━━━━━━ 8s 4ms/step - accuracy: 0.9751 - loss: 0.0678
Epoch 14/30
1875/1875 ━━━━━━━━━━━━━━━━━━━━ 8s 4ms/step - accuracy: 0.9775 - loss: 0.0585
Epoch 15/30
1875/1875 ━━━━━━━━━━━━━━━━━━━━ 8s 4ms/step - accuracy: 0.9811 - loss: 0.0508
Epoch 16/30
1875/1875 ━━━━━━━━━━━━━━━━━━━━ 8s 4ms/step - accuracy: 0.9808 - loss: 0.0494
Epoch 17/30
1870/1875 ━━━━━━━━━━━━━━━━━━━━ 0s 5ms/step - accuracy: 0.9840 - loss: 0.0426
Reached 98%. Stopping the training
1875/1875 ━━━━━━━━━━━━━━━━━━━━ 9s 5ms/step - accuracy: 0.9840 - loss: 0.0426
<keras.src.callbacks.history.History at 0x1d60e7c9060>
# Now we will evaluate the model
test_loss, test_accuracy = model.evaluate(testing_images, testing_labels, verbose=0)
print('Loss is ',test_loss)
print('Accuracy is ',test_accuracy)
Loss is  0.41473188996315
Accuracy is  0.9126999974250793
The model performed much better than with only dense layers, but we can sense overfitting here. Overfitting occurs when a model learns patterns too specific to the training data, reducing its ability to generalize to unseen data. Running for too many epochs can cause the model to memorize training examples instead of learning meaningful patterns. The model achieving about 98% training accuracy but only about 91.3% testing accuracy suggests overfitting, and the jump from a training loss of roughly 0.04 to a test loss of roughly 0.41 points the same way. The model still performs well overall but struggles somewhat with unseen data. To reduce overfitting, techniques like early stopping, dropout, data augmentation, or L2 regularization can be used to improve generalization.
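For instance, a hedged sketch of how dropout and Keras's EarlyStopping callback could be added to this architecture (the dropout rate, patience, and validation split are illustrative choices, not tuned settings):
regularized_model = tf.keras.models.Sequential([
    tf.keras.Input(shape=(28,28,1)),
    tf.keras.layers.Conv2D(64, (3,3), activation='relu'),
    tf.keras.layers.MaxPool2D(2,2),
    tf.keras.layers.Conv2D(64, (3,3), activation='relu'),
    tf.keras.layers.MaxPool2D(2,2),
    tf.keras.layers.Flatten(),
    tf.keras.layers.Dense(128, activation='relu'),
    tf.keras.layers.Dropout(0.3),                    # randomly zeroes 30% of activations during training
    tf.keras.layers.Dense(10, activation='softmax')
])
regularized_model.compile(optimizer='adam',
                          loss=tf.keras.losses.SparseCategoricalCrossentropy(),
                          metrics=['accuracy'])
# Stop when the validation loss stops improving instead of using a fixed accuracy threshold.
early_stop = tf.keras.callbacks.EarlyStopping(monitor='val_loss', patience=3,
                                              restore_best_weights=True)
regularized_model.fit(training_images, training_labels,
                      validation_split=0.1, epochs=30, callbacks=[early_stop])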
import numpy as np
np.argmax(model.predict(testing_images[104:105]))
1/1 ━━━━━━━━━━━━━━━━━━━━ 0s 17ms/step
7
testing_labels[104]
7
Visualizing convolution and maxpooling layers¶
Let's pick label 7 to visualize. We will select three images with label 7 -
[i for i in range(50) if testing_labels[i] == 7]
[9, 12, 22, 36, 38, 43, 45]
FIRST_IMAGE = 9
SECOND_IMAGE = 22
THIRD_IMAGE = 45
CONVOLUTION_NUMBER = 2
LAYERS_TO_VIZUALIZE = [tf.keras.layers.Conv2D, tf.keras.layers.MaxPooling2D]
These three lines define the indices of the images you want to visualize from the testing_images dataset. FIRST_IMAGE, SECOND_IMAGE, and THIRD_IMAGE correspond to the images at indices 9, 22, and 45, respectively.
CONVOLUTION_NUMBER - This sets the index of the filter (channel) whose feature map you want to visualize. Each convolutional layer here has 64 filters, and index 2 selects the third filter in each layer (indexing starts at 0).
LAYERS_TO_VIZUALIZE - Defines the layers you want to visualize, specifically Conv2D and MaxPooling2D. These are the layers from which you'll extract activations.
model.layers
[<Conv2D name=conv2d, built=True>, <MaxPooling2D name=max_pooling2d, built=True>, <Conv2D name=conv2d_1, built=True>, <MaxPooling2D name=max_pooling2d_1, built=True>, <Flatten name=flatten, built=True>, <Dense name=dense, built=True>, <Dense name=dense_1, built=True>]
layer_outputs = [layer.output for layer in model.layers if type(layer) in LAYERS_TO_VIZUALIZE]
layer_outputs
[<KerasTensor shape=(None, 26, 26, 64), dtype=float32, sparse=False, name=keras_tensor_1>, <KerasTensor shape=(None, 13, 13, 64), dtype=float32, sparse=False, name=keras_tensor_2>, <KerasTensor shape=(None, 11, 11, 64), dtype=float32, sparse=False, name=keras_tensor_3>, <KerasTensor shape=(None, 5, 5, 64), dtype=float32, sparse=False, name=keras_tensor_4>]
This line generates a list of output tensors from the layers of type Conv2D or MaxPooling2D in the model. It iterates through all layers in model, checks their type, and appends the output tensor to layer_outputs.
model.inputs
[<KerasTensor shape=(None, 28, 28, 1), dtype=float32, sparse=None, name=keras_tensor>]
activation_model = tf.keras.models.Model(inputs=model.inputs, outputs=layer_outputs)
activation_model
<Functional name=functional_4, built=True>
This creates a new activation model using the Functional API. It defines a new model that takes the same inputs as the original model but outputs the activation values from the layers defined in layer_outputs.
f, axis = plt.subplots(3, len(layer_outputs)) # 3 rows (for the three images) and len(layer_outputs) columns (one for each layer to visualize)
# A loop that iterates over each layer output in layer_outputs. x is the index of the layer being processed in each iteration.
for x in range(len(layer_outputs)):
    f1 = activation_model.predict(testing_images[FIRST_IMAGE].reshape(1,28,28,1), verbose=False)[x]
    axis[0, x].imshow(f1[0, :, :, CONVOLUTION_NUMBER], cmap='inferno')
    axis[0, x].grid(False)
    f2 = activation_model.predict(testing_images[SECOND_IMAGE].reshape(1,28,28,1), verbose=False)[x]
    axis[1, x].imshow(f2[0, :, :, CONVOLUTION_NUMBER], cmap='inferno')
    axis[1, x].grid(False)
    f3 = activation_model.predict(testing_images[THIRD_IMAGE].reshape(1,28,28,1), verbose=False)[x]
    axis[2, x].imshow(f3[0, :, :, CONVOLUTION_NUMBER], cmap='inferno')
    axis[2, x].grid(False)
Code explanation, using the first image as the example since all three follow the same pattern -
- testing_images[FIRST_IMAGE].reshape(1,28,28,1): Reshapes the image at index 9 into a batch of 1 image with shape (1, 28, 28, 1) (required input shape for Conv2D).
- activation_model.predict(...)[x]: Runs the image through the activation_model and extracts the activations for the x-th layer.
- f1[0, :, :, CONVOLUTION_NUMBER]: Selects the feature map produced by the filter at index CONVOLUTION_NUMBER = 2 (the third filter, since indexing starts at 0).
- imshow(): Visualizes the feature map of that convolutional filter using the 'inferno' colormap.
- grid(False): Disables the grid lines on the plot for clarity.
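As a side note, activation_model returns the outputs of all four visualized layers in a single call, so the same figure could also be produced with one predict per image (a minimal sketch of that variant):
f, axis = plt.subplots(3, len(layer_outputs))
for row, image_index in enumerate([FIRST_IMAGE, SECOND_IMAGE, THIRD_IMAGE]):
    # One forward pass yields the activations of every visualized layer for this image.
    activations = activation_model.predict(testing_images[image_index].reshape(1,28,28,1), verbose=False)
    for col, act in enumerate(activations):
        axis[row, col].imshow(act[0, :, :, CONVOLUTION_NUMBER], cmap='inferno')
        axis[row, col].grid(False)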
Let's select a different convolution number, 30, and visualize again -
CONVOLUTION_NUMBER = 30
f, axis = plt.subplots(3, len(layer_outputs)) # 3 rows (for the three images) and len(layer_outputs) columns (one for each layer to visualize)
# A loop that iterates over each layer output in layer_outputs. x is the index of the layer being processed in each iteration.
for x in range(len(layer_outputs)):
    f1 = activation_model.predict(testing_images[FIRST_IMAGE].reshape(1,28,28,1), verbose=False)[x]
    axis[0, x].imshow(f1[0, :, :, CONVOLUTION_NUMBER], cmap='inferno')
    axis[0, x].grid(False)
    f2 = activation_model.predict(testing_images[SECOND_IMAGE].reshape(1,28,28,1), verbose=False)[x]
    axis[1, x].imshow(f2[0, :, :, CONVOLUTION_NUMBER], cmap='inferno')
    axis[1, x].grid(False)
    f3 = activation_model.predict(testing_images[THIRD_IMAGE].reshape(1,28,28,1), verbose=False)[x]
    axis[2, x].imshow(f3[0, :, :, CONVOLUTION_NUMBER], cmap='inferno')
    axis[2, x].grid(False)