Steven Lora - MSIT 675 Project 2 - Generative Adversarial Networks
Generate fake Fashion MNIST images
The goal of this project is to develop a Conditional Generative Adversarial Network (CGAN) that generates fake images of three Fashion MNIST items: Trouser (labeled 1), Pullover (labeled 2), and Sneaker (labeled 7), by training on images from the Fashion MNIST dataset.
Import
# import libraries
import keras
from keras import layers, models, Input, optimizers, ops
import matplotlib.pyplot as plt
import tensorflow as tf
import numpy as np
Get data
Use the function get_data() to obtain images of Trousers, Pullovers, and Sneakers relabeled 0, 1, 2.
def get_data():
    """Returns images of Trousers, Pullovers, and Sneakers relabeled 0, 1, 2"""
    (x_train, y_train), (x_test, y_test) = keras.datasets.fashion_mnist.load_data()
    all_images = np.concatenate([x_train, x_test])
    all_labels = np.concatenate([y_train, y_test])
    retained_indices = np.where(np.isin(all_labels, [1, 2, 7]))
    retained_images = all_images[retained_indices]
    retained_labels = all_labels[retained_indices]
    # Map the original labels 1, 2, 7 to the contiguous values 0, 1, 2
    label_mapping = {1: 0, 2: 1, 7: 2}
    mapped_labels = np.vectorize(label_mapping.get)(retained_labels)
    ITEMS = ['Trouser', 'Pullover', 'Sneaker']
    return retained_images, mapped_labels, ITEMS
all_images, all_class_labels, ITEMS = get_data()
print(f'Shape of images: {all_images.shape}')
print(f'Shape of labels: {all_class_labels.shape}')
print(f'Unique labels: {np.unique(all_class_labels)}')
print(f'Items: {[(i, item) for i,item in enumerate(ITEMS)]}')
Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/train-labels-idx1-ubyte.gz
29515/29515 - 0s 0us/step
Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/train-images-idx3-ubyte.gz
26421880/26421880 - 1s 0us/step
Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/t10k-labels-idx1-ubyte.gz
5148/5148 - 0s 0us/step
Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/t10k-images-idx3-ubyte.gz
4422102/4422102 - 0s 0us/step
Shape of images: (21000, 28, 28)
Shape of labels: (21000,)
Unique labels: [0 1 2]
Items: [(0, 'Trouser'), (1, 'Pullover'), (2, 'Sneaker')]
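The filtering and relabeling inside get_data() can be traced in isolation; a minimal sketch using only NumPy, with a small toy label array standing in for the real dataset:

```python
import numpy as np

# Toy stand-in for the combined Fashion MNIST label array (values 0-9).
all_labels = np.array([1, 5, 2, 7, 7, 1, 0, 2])

# Keep only Trouser (1), Pullover (2), and Sneaker (7).
retained = all_labels[np.isin(all_labels, [1, 2, 7])]

# Remap the surviving labels to the contiguous range 0, 1, 2.
label_mapping = {1: 0, 2: 1, 7: 2}
mapped = np.vectorize(label_mapping.get)(retained)

print(retained.tolist())  # [1, 2, 7, 7, 1, 2]
print(mapped.tolist())    # [0, 1, 2, 2, 0, 1]
```

The contiguous 0-2 range is what lets the labels later be one-hot encoded into three columns.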
Display images
You may use the function displayImages to display images.
def displayImages(images, labels, nCols=10):
    """Displays images with labels (nCols per row)"""
    nRows = np.ceil(len(labels)/nCols).astype('int')  # number of rows
    plt.figure(figsize=(nCols, nRows))                # figure size
    for i in range(len(labels)):
        plt.subplot(nRows, nCols, i+1)
        plt.xticks([])
        plt.yticks([])
        plt.grid(False)
        plt.imshow(images[i], interpolation='spline16', cmap='gray_r')
        plt.xlabel(f'{labels[i]}', fontsize=12)
    plt.tight_layout()
    plt.show()
    return
# display the first k images with labels
k = 30
images = all_images[:k]
labels = [ITEMS[label] for label in all_class_labels[:k]]
displayImages(images, labels)
Specify parameters [2 Points]
Specify parameters to create your CGAN model in the code cell below
# Specify parameters to create your CGAN model in this code cell
batch_size = 64 # batch size used for training
num_channels = 1 # grayscale images (3 for RGB)
num_classes = 3 # 3 Classes (0, 'Trouser'), (1, 'Pullover'), (2, 'Sneaker')
image_size = 28 # width and height of images
latent_dim = 512 # dimensionality of the latent noise vector sampled for the generator
generator_in_channels = latent_dim + num_classes # number of channels in generator input
discriminator_in_channels = num_channels + num_classes # number of channels in discriminator input
In this section, we define the core parameters for our Conditional GAN model. The image shape is based on the Fashion MNIST dataset (28×28 grayscale), and we use a 512-dimensional noise vector as input to the generator. Since we are focusing on only three specific classes (Trouser, Pullover, Sneaker), the number of classes is set to 3. These parameters will guide the architecture and conditioning of both the generator and discriminator models.
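As a quick sanity check on the conditioning arithmetic above (a sketch reusing the same parameter names):

```python
latent_dim = 512
num_classes = 3
num_channels = 1

# The generator input is the latent vector with the one-hot label appended.
generator_in_channels = latent_dim + num_classes        # 512 + 3 = 515
# The discriminator input is the image with one label map per class stacked on.
discriminator_in_channels = num_channels + num_classes  # 1 + 3 = 4

print(generator_in_channels, discriminator_in_channels)  # 515 4
```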
Preprocess [3 Points]
Type in the code to preprocess the data in the code cell below. Scale the pixel values of images to [0, 1] range, add a channel dimension to the images, and one-hot encode the labels. Print the shape of processed images and the shape of processed labels.
# Code to preprocess the data
# Scale the pixel values to [0, 1] range
all_images = all_images.astype("float32") / 255.0
# add a channel dimension to the images
all_images = np.reshape(all_images, (-1, 28, 28, 1))
# one-hot encode the labels
all_labels = keras.utils.to_categorical(all_class_labels, 3)
# Create tf.data.Dataset
dataset = tf.data.Dataset.from_tensor_slices((all_images, all_labels))
dataset = dataset.shuffle(buffer_size=1024).batch(batch_size)
# print the shapes of the resulting images and labels
print(f"Shape of images: {all_images.shape}")
print(f"Shape of labels: {all_labels.shape}")
Shape of images: (21000, 28, 28, 1) Shape of labels: (21000, 3)
In this section, we preprocess the dataset to prepare it for training. First, we normalize the image pixel values to the [0, 1] range by dividing by 255.0. Since the Fashion MNIST images are grayscale, we also add a single channel dimension to match the expected input shape for convolutional layers.
Next, we one-hot encode the class labels to use them effectively during training, especially for conditional generation. The final step converts the processed images and labels into a tf.data.Dataset, enabling efficient batching and shuffling during model training. The printed shapes confirm that the images are now in (21000, 28, 28, 1) format and the labels in (21000, 3) format, representing three target classes.
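The same three preprocessing steps can be sketched with plain NumPy, independent of Keras (random toy images stand in for the dataset; `np.eye` performs the one-hot encoding that keras.utils.to_categorical does):

```python
import numpy as np

rng = np.random.default_rng(0)
images = rng.integers(0, 256, size=(5, 28, 28)).astype("float32")
labels = np.array([0, 2, 1, 1, 0])

images = images / 255.0                       # scale pixels to [0, 1]
images = images.reshape(-1, 28, 28, 1)        # add a channel dimension
one_hot = np.eye(3, dtype="float32")[labels]  # one-hot encode the labels

print(images.shape)   # (5, 28, 28, 1)
print(one_hot.shape)  # (5, 3)
print(one_hot[1])     # [0. 0. 1.]
```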
Create discriminator [5 Points]
In the code cell below create your discriminator model, print the shape of the model input, and display the summary of the model.
# Create the discriminator model
discriminator = keras.Sequential(
    [
        # Input shape: 28 x 28 x 4 (1 image channel + 3 label channels)
        keras.layers.InputLayer((28, 28, discriminator_in_channels)),
        # First convolution layer
        # Number of parameters = (3 * 3 * 4 + 1) * 64 = 2,368
        layers.Conv2D(64, (3, 3), strides=(2, 2), padding="same", name='Conv1'),
        layers.LeakyReLU(negative_slope=0.2),
        layers.Dropout(0.25),
        # Output shape = 14 x 14 x 64
        # Second convolution layer
        # Number of parameters = (3 * 3 * 64 + 1) * 128 = 73,856
        layers.Conv2D(128, (3, 3), strides=(2, 2), padding="same", name='Conv2'),
        layers.LeakyReLU(negative_slope=0.2),
        layers.Dropout(0.25),
        # Output shape = 7 x 7 x 128
        # Third convolution layer
        # Number of parameters = (3 * 3 * 128 + 1) * 256 = 295,168
        layers.Conv2D(256, (3, 3), strides=(1, 1), padding="same", name='Conv3'),
        layers.LeakyReLU(negative_slope=0.2),
        layers.Dropout(0.25),
        # Output shape = 7 x 7 x 256
        # Fourth convolution layer
        # Number of parameters = (3 * 3 * 256 + 1) * 512 = 1,180,160
        layers.Conv2D(512, (3, 3), strides=(1, 1), padding="same", name='Conv4'),
        layers.LeakyReLU(negative_slope=0.2),
        layers.Dropout(0.25),
        # Output shape = 7 x 7 x 512
        # Global max pooling takes the max value from each of the 512 channels
        layers.GlobalMaxPooling2D(),
        # Output: a single logit (score that the image is real)
        layers.Dense(1),
    ],
    name="discriminator",
)
# print the shape of the model input
print(f'Input shape for discriminator: {discriminator.input_shape}')
# display the summary of the model.
discriminator.summary()
Input shape for discriminator: (None, 28, 28, 4)
Model: "discriminator"
Layer (type)                               Output Shape          Param #
Conv1 (Conv2D)                             (None, 14, 14, 64)        2,368
leaky_re_lu (LeakyReLU)                    (None, 14, 14, 64)            0
dropout (Dropout)                          (None, 14, 14, 64)            0
Conv2 (Conv2D)                             (None, 7, 7, 128)        73,856
leaky_re_lu_1 (LeakyReLU)                  (None, 7, 7, 128)             0
dropout_1 (Dropout)                        (None, 7, 7, 128)             0
Conv3 (Conv2D)                             (None, 7, 7, 256)       295,168
leaky_re_lu_2 (LeakyReLU)                  (None, 7, 7, 256)             0
dropout_2 (Dropout)                        (None, 7, 7, 256)             0
Conv4 (Conv2D)                             (None, 7, 7, 512)     1,180,160
leaky_re_lu_3 (LeakyReLU)                  (None, 7, 7, 512)             0
dropout_3 (Dropout)                        (None, 7, 7, 512)             0
global_max_pooling2d (GlobalMaxPooling2D)  (None, 512)                   0
dense (Dense)                              (None, 1)                   513
Total params: 1,552,065 (5.92 MB)
Trainable params: 1,552,065 (5.92 MB)
Non-trainable params: 0 (0.00 B)
In this section, we define the architecture of the discriminator model. The discriminator takes a 28×28 grayscale image with additional channels for the class label (resulting in 4 channels total) and outputs a single scalar value indicating whether the input image is real or fake.
The architecture consists of four convolutional blocks, each followed by a LeakyReLU activation and Dropout for regularization. The number of filters increases progressively (64 → 128 → 256 → 512), allowing the model to learn increasingly abstract spatial features. After the final convolutional layer, a GlobalMaxPooling2D layer compresses the spatial features into a vector, which is passed through a Dense layer to produce the final real/fake prediction score.
The model summary confirms the input shape (28, 28, 4) and shows a total of approximately 1.55 million trainable parameters, indicating a reasonably expressive discriminator suited for this task.
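The per-layer parameter counts quoted in the code comments can be checked directly: a Conv2D layer with a bias term has (kh · kw · c_in + 1) · filters parameters. A small sketch reproducing the summary's totals:

```python
def conv2d_params(kh, kw, c_in, filters):
    """Weights (kh*kw*c_in per filter) plus one bias per filter."""
    return (kh * kw * c_in + 1) * filters

counts = [
    conv2d_params(3, 3, 4, 64),     # Conv1:  2,368
    conv2d_params(3, 3, 64, 128),   # Conv2:  73,856
    conv2d_params(3, 3, 128, 256),  # Conv3:  295,168
    conv2d_params(3, 3, 256, 512),  # Conv4:  1,180,160
    512 + 1,                        # Dense:  512 weights + 1 bias = 513
]
print(sum(counts))  # 1552065, matching the summary's 1,552,065
```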
Create generator [5 Points]
In the code cell below create your generator model, print the shape of the model input, and display the summary of the model.
# Create the generator model
generator = keras.Sequential(
    [
        # Input layer: 512 + 3 = 515 values (latent vector + one-hot label)
        keras.layers.InputLayer((generator_in_channels,)),
        layers.Dense(7 * 7 * latent_dim),
        layers.BatchNormalization(),
        layers.LeakyReLU(negative_slope=0.2),
        layers.Reshape((7, 7, latent_dim)),
        # Output shape 7 x 7 x 512
        # First transposed convolution layer
        layers.Conv2DTranspose(128, (4, 4), strides=(2, 2), padding="same", name='C2DT_1'),
        layers.BatchNormalization(),
        layers.LeakyReLU(negative_slope=0.2),
        # Output 14 x 14 x 128
        # Second transposed convolution layer
        layers.Conv2DTranspose(64, (4, 4), strides=(2, 2), padding="same", name='C2DT_2'),
        layers.BatchNormalization(),
        layers.LeakyReLU(negative_slope=0.2),
        # Output 28 x 28 x 64
        # Third transposed convolution layer
        layers.Conv2DTranspose(32, (4, 4), strides=(1, 1), padding="same", name='C2DT_3'),
        layers.BatchNormalization(),
        layers.LeakyReLU(negative_slope=0.2),
        # Output 28 x 28 x 32
        # Fourth transposed convolution layer (dropped during experimentation)
        # layers.Conv2DTranspose(16, (4, 4), strides=(1, 1), padding="same", name='C2DT_4'),
        # layers.BatchNormalization(),
        # layers.LeakyReLU(negative_slope=0.2),
        # Output 28 x 28 x 16
        # Final convolution layer maps the features to a single-channel image
        layers.Conv2D(1, (3, 3), padding="same", activation="sigmoid", name='Conv1'),
    ],
    name="generator",
)
# print the shape of the model input
print(f'Input shape for generator: {generator.input_shape}')
# display the summary of the model
generator.summary()
Input shape for generator: (None, 515)
Model: "generator"
Layer (type)                                Output Shape          Param #
dense_1 (Dense)                             (None, 25088)       12,945,408
batch_normalization (BatchNormalization)    (None, 25088)          100,352
leaky_re_lu_4 (LeakyReLU)                   (None, 25088)                0
reshape (Reshape)                           (None, 7, 7, 512)            0
C2DT_1 (Conv2DTranspose)                    (None, 14, 14, 128)  1,048,704
batch_normalization_1 (BatchNormalization)  (None, 14, 14, 128)        512
leaky_re_lu_5 (LeakyReLU)                   (None, 14, 14, 128)          0
C2DT_2 (Conv2DTranspose)                    (None, 28, 28, 64)     131,136
batch_normalization_2 (BatchNormalization)  (None, 28, 28, 64)         256
leaky_re_lu_6 (LeakyReLU)                   (None, 28, 28, 64)           0
C2DT_3 (Conv2DTranspose)                    (None, 28, 28, 32)      32,800
batch_normalization_3 (BatchNormalization)  (None, 28, 28, 32)         128
leaky_re_lu_7 (LeakyReLU)                   (None, 28, 28, 32)           0
Conv1 (Conv2D)                              (None, 28, 28, 1)          289
Total params: 14,259,585 (54.40 MB)
Trainable params: 14,208,961 (54.20 MB)
Non-trainable params: 50,624 (197.75 KB)
In this section, we define the architecture of the generator model, which takes as input a random noise vector concatenated with a one-hot encoded class label. The model learns to generate 28×28 grayscale images conditioned on the specified class.
The generator begins with a dense layer that projects the latent space into a 7×7×latent_dim feature map, followed by three Conv2DTranspose (also known as "deconvolution") layers to progressively upsample the image to the target resolution. Each upsampling layer is followed by Batch Normalization and a LeakyReLU activation to promote stable training and improve feature diversity.
Although a fourth Conv2DTranspose layer was originally considered, it was commented out during experimentation. Including the additional layer tended to degrade image quality, likely due to over-smoothing or unnecessary complexity given the 28×28 output resolution. Therefore, the final architecture retains only three upsampling blocks, which yielded sharper and more distinguishable results for the target classes (Trousers, Pullovers, Sneakers).
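The output sizes noted in the code comments follow from the stride arithmetic for Conv2DTranspose with padding="same", where the spatial size is simply multiplied by the stride (the kernel size drops out). A quick sketch:

```python
def conv2d_transpose_out(size, stride):
    # With padding="same", Keras gives out = in * stride for Conv2DTranspose.
    return size * stride

size = 7                  # after the Dense + Reshape block
for stride in (2, 2, 1):  # strides of C2DT_1, C2DT_2, C2DT_3
    size = conv2d_transpose_out(size, stride)
print(size)  # 28 -- the target image resolution
```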
Create ConditionalGAN model [5 Points]
In the code cell below create your conditional GAN model and display the summary of the model.
# class ConditionalGAN
class ConditionalGAN(keras.Model):
    def __init__(self, discriminator, generator, latent_dim):
        super().__init__()
        self.discriminator = discriminator
        self.generator = generator
        self.latent_dim = latent_dim
        self.seed_generator = keras.random.SeedGenerator(1337)
        self.gen_loss_tracker = keras.metrics.Mean(name="generator_loss")
        self.disc_loss_tracker = keras.metrics.Mean(name="discriminator_loss")

    @property
    def metrics(self):
        return [self.gen_loss_tracker, self.disc_loss_tracker]

    def compile(self, d_optimizer, g_optimizer, loss_fn):
        super().compile()
        self.d_optimizer = d_optimizer
        self.g_optimizer = g_optimizer
        self.loss_fn = loss_fn

    def train_step(self, data):
        # Unpack the data.
        real_images, one_hot_labels = data

        # Add dummy dimensions to the labels so that they can be concatenated with
        # the images. This is for the discriminator.
        image_one_hot_labels = one_hot_labels[:, :, None, None]
        image_one_hot_labels = ops.repeat(
            image_one_hot_labels, repeats=[image_size * image_size]
        )
        image_one_hot_labels = ops.reshape(
            image_one_hot_labels, (-1, image_size, image_size, num_classes)
        )

        # Sample random points in the latent space and concatenate the labels.
        # This is for the generator.
        batch_size = ops.shape(real_images)[0]
        random_latent_vectors = keras.random.normal(
            shape=(batch_size, self.latent_dim), seed=self.seed_generator
        )
        random_vector_labels = ops.concatenate(
            [random_latent_vectors, one_hot_labels], axis=1
        )

        # Decode the noise (guided by labels) to fake images.
        generated_images = self.generator(random_vector_labels)

        # Combine them with real images. Note that we are concatenating the labels
        # with these images here.
        fake_image_and_labels = ops.concatenate(
            [generated_images, image_one_hot_labels], -1
        )
        real_image_and_labels = ops.concatenate([real_images, image_one_hot_labels], -1)
        combined_images = ops.concatenate(
            [fake_image_and_labels, real_image_and_labels], axis=0
        )

        # Assemble labels discriminating real from fake images.
        labels = ops.concatenate(
            [ops.ones((batch_size, 1)), ops.zeros((batch_size, 1))], axis=0
        )

        # Train the discriminator.
        with tf.GradientTape() as tape:
            predictions = self.discriminator(combined_images)
            d_loss = self.loss_fn(labels, predictions)
        grads = tape.gradient(d_loss, self.discriminator.trainable_weights)
        self.d_optimizer.apply_gradients(
            zip(grads, self.discriminator.trainable_weights)
        )

        # Sample random points in the latent space.
        random_latent_vectors = keras.random.normal(
            shape=(batch_size, self.latent_dim), seed=self.seed_generator
        )
        random_vector_labels = ops.concatenate(
            [random_latent_vectors, one_hot_labels], axis=1
        )

        # Assemble labels that say "all real images".
        misleading_labels = ops.zeros((batch_size, 1))

        # Train the generator (note that we should *not* update the weights
        # of the discriminator)!
        with tf.GradientTape() as tape:
            fake_images = self.generator(random_vector_labels)
            fake_image_and_labels = ops.concatenate(
                [fake_images, image_one_hot_labels], -1
            )
            predictions = self.discriminator(fake_image_and_labels)
            g_loss = self.loss_fn(misleading_labels, predictions)
        grads = tape.gradient(g_loss, self.generator.trainable_weights)
        self.g_optimizer.apply_gradients(zip(grads, self.generator.trainable_weights))

        # Monitor loss.
        self.gen_loss_tracker.update_state(g_loss)
        self.disc_loss_tracker.update_state(d_loss)
        return {
            "g_loss": self.gen_loss_tracker.result(),
            "d_loss": self.disc_loss_tracker.result(),
        }

# create model
cond_gan = ConditionalGAN(
    discriminator=discriminator, generator=generator, latent_dim=latent_dim
)
cond_gan.compile(
    d_optimizer=keras.optimizers.Adam(learning_rate=0.0003),
    g_optimizer=keras.optimizers.Adam(learning_rate=0.0003),
    loss_fn=keras.losses.BinaryCrossentropy(from_logits=True),
)
# display the summary of the model
cond_gan.summary()
Model: "conditional_gan"
Layer (type)                  Output Shape         Param #
discriminator (Sequential)    (None, 1)             1,552,065
generator (Sequential)        (None, 28, 28, 1)    14,259,585
Total params: 15,811,650 (60.32 MB)
Trainable params: 15,761,026 (60.12 MB)
Non-trainable params: 50,624 (197.75 KB)
In this section, we define the ConditionalGAN class, which encapsulates the custom training logic for our Conditional GAN using Keras' subclassed model API. The overall structure of this class is based on open-source examples provided in the official Keras documentation and tutorials on conditional GANs. We adapted the implementation to work with our specific dataset, generator and discriminator designs, and project parameters. Minor modifications were made to suit our data shape and training preferences.
The class tracks generator and discriminator losses as custom metrics and is compiled with two separate optimizers (one for each network) and a shared binary cross-entropy loss function.
The custom train_step() method controls the alternating training of both networks. Real and fake images are paired with label information using one-hot encoding and spatial expansion so that the discriminator receives both the image and class context. The generator is conditioned on the class labels via concatenation with noise vectors.
Though an alternative dual-input structure was explored, this one-hot + concatenation strategy proved more straightforward and yielded strong results during training.
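The two conditioning paths inside train_step() can be traced shape-by-shape with plain NumPy (np.repeat/np.reshape behave like ops.repeat/ops.reshape here; a toy batch of 2 with image_size=28 and num_classes=3 as above):

```python
import numpy as np

batch_size, image_size, num_classes, latent_dim = 2, 28, 3, 512
one_hot_labels = np.eye(num_classes, dtype="float32")[[0, 2]]  # classes 0 and 2

# Discriminator path: expand each one-hot label into per-pixel label maps,
# mirroring the repeat/reshape sequence in train_step().
maps = one_hot_labels[:, :, None, None]
maps = np.repeat(maps, image_size * image_size)
maps = maps.reshape(-1, image_size, image_size, num_classes)
print(maps.shape)  # (2, 28, 28, 3) -- concatenated onto the image channels

# Generator path: append the one-hot label to the latent noise vector.
noise = np.random.normal(size=(batch_size, latent_dim)).astype("float32")
vec = np.concatenate([noise, one_hot_labels], axis=1)
print(vec.shape)  # (2, 515) -- matches generator_in_channels
```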
Function to generate fake images [5 Points]
In the code cell below define a function generate_fake_images that takes 2 arguments, CGAN_model and class_label_list, and returns fake images generated by CGAN_model corresponding to the labels specified in class_label_list.
# Define function: generate_fake_images
def generate_fake_images(generator_model, class_label_list):
    """Returns fake images of the classes in class_label_list using generator_model"""
    labels = keras.utils.to_categorical(class_label_list, num_classes)
    labels = ops.cast(labels, "float32")
    noise = keras.random.normal(shape=(len(class_label_list), latent_dim))
    noise_and_labels = ops.concatenate([noise, labels], 1)
    fake = generator_model.predict(noise_and_labels, verbose=0)
    return fake
This function generates fake images from the generator model based on a list of class labels. It first one-hot encodes the labels, samples random noise vectors, and concatenates the two. The combined input is then passed to the generator to produce class-conditioned outputs. This function is used to visualize the generator's performance during and after training.
Train model [5 Points]
In the code cell below type in your code to train the model over 30 epochs. After each epoch save the weights of the generator and display fake images generated for classes with labels specified in class_label_list.
# Train the model over 30 epochs.
class_label_list = 3*[0] + 3*[1] + 3*[2]  # display 3 images of each class
print(f"class_label_list: {class_label_list}")
epochs = 30  # number of epochs specified by the assignment
for i in range(epochs):
    cond_gan.fit(dataset, epochs=1)                                       # train model
    cond_gan.generator.save_weights(f"generator_epoch_{i+1}.weights.h5")  # save weights
    images = generate_fake_images(cond_gan.generator, class_label_list)   # fake images
    print(f'Fake images after epoch {i+1}:')                              # epoch heading
    displayImages(images, class_label_list)                               # display images
    print()
class_label_list: [0, 0, 0, 1, 1, 1, 2, 2, 2]
329/329 - 35s 55ms/step - d_loss: 0.2747 - g_loss: 5.4549
Fake images after epoch 1:
329/329 - 13s 39ms/step - d_loss: 0.2564 - g_loss: 3.4446
Fake images after epoch 2:
329/329 - 13s 40ms/step - d_loss: 0.4253 - g_loss: 2.2602
Fake images after epoch 3:
329/329 - 14s 41ms/step - d_loss: 0.4115 - g_loss: 2.4745
Fake images after epoch 4:
329/329 - 13s 40ms/step - d_loss: 0.4104 - g_loss: 2.0053
Fake images after epoch 5:
329/329 - 13s 40ms/step - d_loss: 0.4202 - g_loss: 2.1133
Fake images after epoch 6:
329/329 - 13s 40ms/step - d_loss: 0.4556 - g_loss: 1.9841
Fake images after epoch 7:
329/329 - 13s 41ms/step - d_loss: 0.4009 - g_loss: 1.9964
Fake images after epoch 8:
329/329 - 13s 41ms/step - d_loss: 0.4124 - g_loss: 2.0065
Fake images after epoch 9:
329/329 - 13s 41ms/step - d_loss: 0.3626 - g_loss: 2.0917
Fake images after epoch 10:
329/329 - 13s 41ms/step - d_loss: 0.3498 - g_loss: 2.3558
Fake images after epoch 11:
329/329 - 14s 41ms/step - d_loss: 0.3973 - g_loss: 2.4597
Fake images after epoch 12:
329/329 - 14s 41ms/step - d_loss: 0.4216 - g_loss: 1.9138
Fake images after epoch 13:
329/329 - 13s 41ms/step - d_loss: 0.4130 - g_loss: 1.8849
Fake images after epoch 14:
329/329 - 13s 41ms/step - d_loss: 0.4309 - g_loss: 1.8939
Fake images after epoch 15:
329/329 - 13s 41ms/step - d_loss: 0.4244 - g_loss: 1.9779
Fake images after epoch 16:
329/329 - 13s 41ms/step - d_loss: 0.4285 - g_loss: 1.7745
Fake images after epoch 17:
329/329 - 14s 41ms/step - d_loss: 0.4279 - g_loss: 1.9556
Fake images after epoch 18:
329/329 - 13s 41ms/step - d_loss: 0.4262 - g_loss: 1.8995
Fake images after epoch 19:
329/329 - 13s 40ms/step - d_loss: 0.4291 - g_loss: 1.7767
Fake images after epoch 20:
329/329 - 13s 41ms/step - d_loss: 0.4544 - g_loss: 1.6738
Fake images after epoch 21:
329/329 - 13s 41ms/step - d_loss: 0.4406 - g_loss: 1.7131
Fake images after epoch 22:
329/329 - 13s 41ms/step - d_loss: 0.4405 - g_loss: 1.6870
Fake images after epoch 23:
329/329 - 13s 41ms/step - d_loss: 0.4561 - g_loss: 1.6931
Fake images after epoch 24:
329/329 - 13s 41ms/step - d_loss: 0.4401 - g_loss: 1.7038
Fake images after epoch 25:
329/329 - 14s 41ms/step - d_loss: 0.4221 - g_loss: 1.9136
Fake images after epoch 26:
329/329 - 14s 41ms/step - d_loss: 0.4587 - g_loss: 1.6694
Fake images after epoch 27:
329/329 - 13s 41ms/step - d_loss: 0.4585 - g_loss: 1.6672
Fake images after epoch 28:
329/329 - 13s 41ms/step - d_loss: 0.4639 - g_loss: 1.6952
Fake images after epoch 29:
329/329 - 13s 41ms/step - d_loss: 0.4380 - g_loss: 1.6682
Fake images after epoch 30:
This section performs the training of the Conditional GAN over 30 epochs. After each epoch, the generator's weights are saved and a batch of class-conditioned images is generated for visual evaluation. The printed loss values and generated images help monitor training progress.
It's important to note that GAN training is inherently adversarial and stochastic. The generator and discriminator are locked in a dynamic competition, where improvements in one lead to challenges for the other. As a result, the generator's performance may not consistently improve in every single epoch; some generated images may look better or worse than those from the previous epoch. However, the overall quality typically improves over time as the generator learns to better fool the discriminator.
This iterative, game-like training process is central to GANs and distinguishes them from traditional supervised models.
Use trained generator [5 Points]
Create a generator with weights saved in an epoch that you consider generates the most authentic fake images and use it to generate fake images for the classes specified in class_label_list.
# choosing the weights and defining new generator
chosen_epoch = 30 # chosen epoch
chosen_generator = generator # reused the same generator instance defined earlier to ensure the architecture matches
# Load the weights
chosen_generator.load_weights(f"generator_epoch_{chosen_epoch}.weights.h5")
# Display fake images generated for classes specified in class_label_list.
class_label_list = 10*[0] + 10*[1] + 10*[2]
print(f"class_label_list: {class_label_list}")
images = generate_fake_images(chosen_generator, class_label_list)
print(f'Fake images:')
displayImages(images, [ITEMS[i] for i in class_label_list])
class_label_list: [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2] Fake images:
In this final step, we load the generator weights from the epoch that produced the most convincing outputs (in this case, epoch 30). Using the generate_fake_images() function, we produce and visualize a batch of fake images conditioned on each of the three target classes.
This allows us to evaluate the final quality of the generator's outputs and verify that it has learned to produce distinct and class-specific representations. The generated trousers, pullovers, and sneakers demonstrate the model's ability to synthesize realistic images that align with the corresponding labels.
Conclusion
In this project, we successfully implemented a Conditional Generative Adversarial Network (CGAN) to generate grayscale Fashion MNIST images conditioned on class labels. We focused on three specific classes (trousers, pullovers, and sneakers) and used a one-hot encoded label strategy to guide the generator and discriminator.
The generator was trained to produce images from random noise and class labels, while the discriminator learned to distinguish between real and synthetic images using both pixel content and label information. Over the course of 30 epochs, we observed the generator improve its ability to produce visually coherent and class-specific outputs.
While we explored more advanced generator and discriminator structures, we ultimately found that a simpler one-hot concatenation approach yielded the most stable results for this dataset. Loss values and generated image samples provided insight into the training dynamics, and the final model was able to consistently produce distinguishable images for each target class.
This project reinforced key concepts in GAN training, conditional generation, adversarial learning, and image preprocessing, all while demonstrating how generative models can be guided using label information to produce more meaningful outputs.
Future Improvements:
- Experiment with label embedding and dual-input models
- Add regularization techniques like spectral normalization
- Try more complex architectures (e.g., ResNet-based generators)
- Extend to color datasets or higher resolutions