{"nbformat":4,"nbformat_minor":0,"metadata":{"colab":{"provenance":[],"collapsed_sections":["IMk9-Qiy3G8o","YgXg8ezlc05-","KUCRQ-UfdaLn","lBSZSvO-2QxJ"],"gpuType":"T4"},"kernelspec":{"name":"python3","display_name":"Python 3"},"language_info":{"name":"python"},"accelerator":"GPU"},"cells":[{"cell_type":"markdown","source":["The code is composed on Google Colab.\n","This Python notebook is devoted to training the beta-VAE on Fashion MNIST dataset.\n","\n","\n","Code modified from https://github.com/mdhabibi/DeepLearning-VAE/blob/main/notebooks/MNIST_VAE_main_dim%3D15.ipynb"],"metadata":{"id":"7aCoDoZM18A9"}},{"cell_type":"code","source":["from google.colab import drive\n","drive.mount('/content/drive')"],"metadata":{"id":"cNMAgMlCvpTZ"},"execution_count":null,"outputs":[]},{"cell_type":"code","source":["cd/content/drive/MyDrive/OTHJ_FashionMNIST_MNIST"],"metadata":{"id":"nPYJV5EjvvKc"},"execution_count":null,"outputs":[]},{"cell_type":"code","source":["# @title imports\n","\n","\n","# Data Handling and Numerical Libraries\n","import os\n","import numpy as np                          # Handling large data arrays\n","import pandas as pd\n","import matplotlib.pyplot as plt             # Creating visualizations\n","from matplotlib.colors import ListedColormap\n","import seaborn as sns                       # Advanced data visualization\n","import random\n","\n","import tensorflow as tf\n","# Keras - Deep Learning API\n","import keras                                # High-level neural networks API\n","from keras.datasets import mnist            # MNIST dataset of hand-written digits\n","from keras.datasets import fashion_mnist\n","from keras.layers import (                  # Neural network layers\n","    Conv2D, Conv2DTranspose,\n","    Input, Flatten, Dense,\n","    Lambda, Reshape\n",")\n","from keras.models import Model              # Model definition and training\n","from keras.callbacks import (               # Training callbacks\n","    EarlyStopping, ModelCheckpoint\n",")\n","from keras import backend as K\n","from sklearn.manifold import TSNE\n","\n","import sys\n","sys.path.append('/Volumes/D/GitHub-Portfolio/DeepLearning-MNIST-VAE/src/')\n","\n","# Metrics\n","from keras.metrics import MeanSquaredError\n","from skimage.metrics import peak_signal_noise_ratio as psnr"],"metadata":{"id":"R0c-JSjpz9n_","cellView":"form"},"execution_count":null,"outputs":[]},{"cell_type":"code","source":["# @title VAE Loss\n","\n","import keras\n","from keras import layers\n","from keras import backend as K\n","\n","class VAELossLayer(layers.Layer):\n","    \"\"\"\n","    Custom Keras layer that calculates the loss (reconstruction + KL divergence)\n","    of the Variational AutoEncoder (VAE)\n","    \"\"\"\n","\n","    def __init__(self, beta_recon=100., beta_kl=0.1, **kwargs):\n","    # def __init__(self, beta=0.0005, **kwargs):\n","        super().__init__(**kwargs)\n","        self.beta_recon = beta_recon\n","        self.beta_kl = beta_kl\n","\n","    def compute_output_shape(self, input_shape):\n","        return input_shape[0]  # or return ()\n","\n","    def calculate_loss(self, original_input, reconstructed_output, mu, sigma):\n","        \"\"\"\n","        Calculates VAE loss, which is the sum of the reconstruction loss and KL-divergence loss\n","        \"\"\"\n","        # print(original_input)\n","        original_input = tf.keras.layers.Flatten(data_format='channels_last')(original_input)\n","        reconstructed_output = tf.keras.layers.Flatten(data_format='channels_last')(reconstructed_output)\n","        # reconstruction_loss = keras.metrics.binary_crossentropy(original_input, reconstructed_output)\n","        reconstruction_loss = tf.reduce_sum(tf.square(original_input - reconstructed_output), axis=[1])\n","        reconstruction_loss = self.beta_recon * reconstruction_loss\n","        # kl_loss = -self.beta * K.mean(1 + sigma - K.square(mu) - tf.exp(sigma), axis=-1)\n","        kl_loss = -self.beta_kl * tf.reduce_mean(1 + sigma - tf.square(mu) - tf.exp(sigma), axis=-1)\n","\n","\n","        return tf.reduce_mean(reconstruction_loss + kl_loss)\n","        # return K.mean(reconstruction_loss + kl_loss)\n","\n","    def call(self, inputs):\n","        \"\"\"\n","        Computes the loss and adds it to the layer's losses\n","        \"\"\"\n","        original_input, reconstructed_output, mu, sigma = inputs\n","\n","        loss = self.calculate_loss(original_input, reconstructed_output, mu, sigma)\n","        self.add_loss(loss)\n","        return original_input"],"metadata":{"id":"VaALbLyi05jb","cellView":"form"},"execution_count":null,"outputs":[]},{"cell_type":"markdown","source":["Data processing\n","---\n","\n"],"metadata":{"id":"IMk9-Qiy3G8o"}},{"cell_type":"code","source":["(x_train, y_train), (x_test, y_test) = fashion_mnist.load_data()\n","assert x_train.shape == (60000, 28, 28)\n","assert x_test.shape == (10000, 28, 28)\n","assert y_train.shape == (60000,)\n","assert y_test.shape == (10000,)\n","\n","concatenated_x = tf.concat([x_train, x_test], axis=0)\n","concatenated_y = tf.concat([y_train, y_test], axis=0)\n","\n","list_of_images = []\n","for i in range(10):\n","  list_of_images.append(concatenated_x[concatenated_y == i]) # (7000, 28, 28)"],"metadata":{"id":"sI9im95v1ECv"},"execution_count":null,"outputs":[]},{"cell_type":"code","source":["# Normalize the images to [0, 1]\n","x_train = x_train.astype('float32') / 255.\n","x_test = x_test.astype('float32') / 255."],"metadata":{"id":"CJHZ813EwGGO"},"execution_count":null,"outputs":[]},{"cell_type":"code","source":["# Retrieving the number of images and their dimensions from the train set\n","img_num_train = x_train.shape[0]\n","img_width     = x_train.shape[1]\n","img_height    = x_train.shape[2]\n","\n","# Displaying the train set information\n","print(f\"The MNIST train set contains {img_num_train} images, each with dimensions:\"\n","      f\"\\n(width x height) = ({img_width} x {img_height}) pixels.\")\n","\n","# Retrieving the number of images from the test set\n","img_num_test  = x_test.shape[0]\n","\n","# Displaying the test set information\n","print(f\"The MNIST test set also contains {img_num_test} images with the same dimensions as the train set.\")"],"metadata":{"id":"4i9dpY6EwbLY","colab":{"base_uri":"https://localhost:8080/"},"outputId":"a59d148f-be16-4139-a182-e7aae324387c"},"execution_count":null,"outputs":[{"output_type":"stream","name":"stdout","text":["The MNIST train set contains 60000 images, each with dimensions:\n","(width x height) = (28 x 28) pixels.\n","The MNIST test set also contains 10000 images with the same dimensions as the train set.\n"]}]},{"cell_type":"code","source":["# Define the number of channels: 1 for grayscale images\n","num_channels = 1\n","\n","# Reshape the training and test datasets to include the channel dimension\n","x_train = x_train.reshape(img_num_train, img_height, img_width, num_channels)\n","x_test = x_test.reshape(img_num_test, img_height, img_width, num_channels)\n","concatenated_x_for_training_VAE = tf.concat([x_train, x_test], axis=0)\n","x_for_training_VAE = x_train\n","\n","# Define the input dimensions for the CNN\n","input_dimensions = (img_height, img_width, num_channels)\n","\n","# Display the reshaped dimensions\n","print(f\"Dimensions of each image for the model: (img_height, img_width, num_channels) = {input_dimensions}.\")\n","print(f\"Reshaped training data shape: {x_train.shape}\")\n"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"id":"5MM3NNHJwoMA","outputId":"c97694cf-d918-43d5-fb2e-aead85167249"},"execution_count":null,"outputs":[{"output_type":"stream","name":"stdout","text":["Dimensions of each image for the model: (img_height, img_width, num_channels) = (28, 28, 1).\n","Reshaped training data shape: (60000, 28, 28, 1)\n"]}]},{"cell_type":"code","source":["def visualize_samples(data, sample_indices, figsize=(3.2, 3.2)):\n","    \"\"\"\n","    Visualizes a set of images from the provided dataset.\n","\n","    :param data: The dataset containing the images.\n","    :param sample_indices: A list of indices for the images to be visualized.\n","    :param figsize: Size of the figure for the plots.\n","    \"\"\"\n","    plt.figure(figsize=figsize)\n","\n","    for i, img_index in enumerate(sample_indices):\n","        plt.subplot(2, 2, i + 1)\n","        plt.imshow(data[img_index][:, :, 0], cmap='gray')\n","        plt.title(f'Image index: {img_index}')\n","        plt.axis('off')\n","\n","    plt.tight_layout()\n","    plt.show()"],"metadata":{"id":"TKrk4WN51KKj"},"execution_count":null,"outputs":[]},{"cell_type":"code","source":["# Randomly sample indices\n","random_indices = random.sample(range(len(x_train)), 4)\n","\n","# Visualize the sampled images\n","visualize_samples(x_train, random_indices)"],"metadata":{"id":"QCi_4v8m1NE9"},"execution_count":null,"outputs":[]},{"cell_type":"markdown","source":["\n","\n","---\n","\n","\n","## Model set up\n","  \n","---\n","\n"],"metadata":{"id":"YgXg8ezlc05-"}},{"cell_type":"markdown","source":["Model Architecture\n","In this section, we will outline the architecture of our Variational Autoencoder (VAE). The VAE model is composed of three main components:\n","\n","\n","1.   Encoder: The encoder's role is to take the input data and compress it into a latent (hidden) space, effectively reducing its dimensionality and capturing the essential features of the data.\n","2.   Latent Space: The latent space represents the compressed representation of the input data. Here, we model the data distribution that we aim to generate from.\n","\n","3.   Decoder: The decoder part of the VAE takes the representation in the latent space and reconstructs the original input data from this compressed form.\n","\n","This structure allows the VAE not only to generate new data similar to the input data but also to learn a meaningful and efficient representation of the input data in the latent space. Let's start by detailing the encoder part of our VAE.\n","\n","**Encoder Architecture**\n","\n","The encoder is a crucial component of the VAE that compresses the input data into a latent space. It consists of several layers, each with specific functions:\n","\n","1. Input Layer: Captures the shape of the input data.\n","2. Convolution Layers: Extracts features from the input.\n","3. Flattening Layer: Transforms the output of the convolution layers into a 1D tensor.\n","4. Dense Layer: Further processes the features.\n","5. Output Layer: Prepares for transition to the latent space.\n","\n","Note that the latent dimension represents the number of dimensions in the space to which the encoder compresses the input.\n","\n","For Fashion MNIST to MNIST experiment (task 3), we choose a dimensionality of 35.\n","\n"],"metadata":{"id":"xjiHByp2c06A"}},{"cell_type":"code","source":["latent_space_dim = 35"],"metadata":{"id":"Z64GvQ8rc06B"},"execution_count":null,"outputs":[]},{"cell_type":"code","source":["# Input Layer\n","# Defines the shape of the input data for the encoder.\n","encoder_input_layer = Input(shape=input_dimensions, name='encoder_input_layer')"],"metadata":{"id":"PF_k7FJTc06B"},"execution_count":null,"outputs":[]},{"cell_type":"code","source":["# Convolution Layers\n","# Applies convolution operations to extract features from the input image.\n","encoder_layer = Conv2D(128, 5, padding='same', activation='relu')(encoder_input_layer)\n","encoder_layer = Conv2D(128, 3, padding='same', activation='relu')(encoder_layer)\n","encoder_layer = Conv2D(64, 3, padding='same', strides=2, activation='relu')(encoder_layer)\n","encoder_layer = Conv2D(64, 3, padding='same', activation='relu')(encoder_layer)\n","encoder_layer = Conv2D(64, 3, padding='same', activation='relu')(encoder_layer)\n","encoder_layer = Conv2D(64, 3, padding='same', activation='relu')(encoder_layer)\n","encoder_layer = Conv2D(64, 3, padding='same', activation='relu')(encoder_layer)\n","\n","enc_shape = tf.keras.backend.int_shape(encoder_layer)\n","\n","# Note on Strides:\n","# Strides define the step size of the filter as it moves across the image. Here, a stride of 2 reduces the spatial dimensions of the output."],"metadata":{"id":"x4OdhUn55MF7"},"execution_count":null,"outputs":[]},{"cell_type":"code","source":["# Flattening Layer\n","# Converts the 3D output of convolution layers into a 1D tensor for dense layers.\n","encoder_layer = Flatten()(encoder_layer)"],"metadata":{"id":"cJR7iO2fc06C"},"execution_count":null,"outputs":[]},{"cell_type":"code","source":["# Dense Layer\n","# A fully connected layer that combines extracted features and performs further learning.\n","encoder_layer = Dense(64, activation='relu')(encoder_layer)"],"metadata":{"id":"f7yyu4IVc06C"},"execution_count":null,"outputs":[]},{"cell_type":"code","source":["# Output Layer for Encoder\n","# Prepares the encoded data for transition into the latent space, approximating a probability distribution.\n","mu_layer = Dense(latent_space_dim, name='latent_mu')(encoder_layer)\n","sigma_layer = Dense(latent_space_dim, name='latent_sigma')(encoder_layer)\n","\n","# Storing the output shape for use in the decoder\n","encoder_output_shape = (None, 64) # K.int_shape(encoder_layer)\n","print(f\"Output shape of encoder: {encoder_output_shape}\")"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"outputId":"7a636739-e5aa-470a-f5bd-3d44bd783c1e","id":"6tExgEi9c06C"},"execution_count":null,"outputs":[{"output_type":"stream","name":"stdout","text":["Output shape of encoder: (None, 64)\n"]}]},{"cell_type":"markdown","source":["**Latent Space and Reparameterization Trick**\n","\n","\n","The reparameterization trick is a fundamental concept in training Variational Autoencoders. It allows us to backpropagate through random sampling processes, which are inherently non-differentiable.\n","\n","\n","The Challenge: Directly sampling from the Gaussian distribution defined by $\\mu$ and $\\sigma$ is non-differentiable, posing a challenge for backpropagation.\n","\n","The Solution: We sample from a standard normal distribution and transform this sample using $\\mu$ and $\\sigma$. The transformed sample $z=\\sigma \\epsilon + \\mu$ (where $\\epsilon$ is a random gaussian sample) is differentiable with respect to $\\mu$ and $\\sigma$."],"metadata":{"id":"7JDDEwpAc06C"}},{"cell_type":"code","source":["### Implementing the Reparameterization Trick\n","def sample_z(args):\n","    \"\"\"\n","    Generate a sample from the Gaussian distribution defined by args=(mu, sigma).\n","\n","    Args:\n","    mu_layer:    The mean of the Gaussian distribution.\n","    sigma_layer: The log standard deviation of the Gaussian distribution.\n","\n","    Returns:\n","    A sample from the Gaussian distribution.\n","    \"\"\"\n","    mu_layer, sigma_layer = args\n","    batch_size = tf.shape(mu_layer)[0]\n","    dim = tf.shape(mu_layer)[1]\n","    # Generate a random sample from a standard normal distribution with the same shape\n","    epsilon = tf.random.normal(shape=(batch_size, dim))\n","    # Scale and shift the sample by mu and sigma\n","    return mu_layer + tf.exp(sigma_layer / 2) * epsilon"],"metadata":{"id":"FZaFgmlec06C"},"execution_count":null,"outputs":[]},{"cell_type":"code","source":["# Creating the 'z' layer using the Lambda layer to apply the reparameterization trick\n","z = Lambda(sample_z, output_shape=(latent_space_dim,), name='z')([mu_layer, sigma_layer])\n","\n","# Note on Lambda Layer:\n","# The Lambda layer in Keras allows us to apply arbitrary expressions that are differentiable."],"metadata":{"id":"Wqn6bR51c06C"},"execution_count":null,"outputs":[]},{"cell_type":"code","source":["# Building the encoder model\n","encoder_model = Model(encoder_input_layer, [mu_layer, sigma_layer, z], name='encoder_model')\n","\n","# # Save the model for future use\n","# save_path=os.getcwd()\n","# encoder_model.save(save_path + '/encoder_model_MNIST_dim_15.h5')\n","\n","# Display the model summary\n","print(encoder_model.summary())\n","\n"],"metadata":{"id":"3LBNtHVgc06D"},"execution_count":null,"outputs":[]},{"cell_type":"markdown","source":["**Decoder Architecture**\n","\n","The decoder is the component of the VAE that reconstructs the data from the latent space representation. It mirrors the encoder in reverse, progressively upscaling the compressed data back to its original dimension. The decoder consists of the following key steps:\n","\n","Input Layer: Starts with the latent space representation.\n","\n","Dense and Reshape Layers: Upscales the compressed data to a higher dimension suitable for convolutional operations.\n","\n","Deconvolutional (Conv2DTranspose) Layers: Further upscales and\n","refines the data to reconstruct the original input.\n"],"metadata":{"id":"vV7R8FcFc06D"}},{"cell_type":"code","source":["# Decoder Input Layer\n","decoder_input_layer = Input(shape=(latent_space_dim,), name='decoder_input_layer')"],"metadata":{"id":"Ll-vZ9NPc06D"},"execution_count":null,"outputs":[]},{"cell_type":"code","source":["# Initial Dense Layer\n","# The number of units is derived from the last convolutional layer of the encoder\n","num_units = np.prod(enc_shape[1:]) # 14 * 14 * 64\n","decoder_dense_layer = Dense(num_units, activation='relu')(decoder_input_layer)\n","\n","# Reshaping Layer\n","# The dense layer's output is reshaped to match the last convolutional layer's output shape in the encoder\n","reshape_dims = (14, 14, 64)\n","decoder_layer = Reshape(reshape_dims)(decoder_dense_layer)\n","\n","decoder_layer = Conv2DTranspose(64, 3, padding='same', activation='relu')(decoder_layer)\n","decoder_layer = Conv2DTranspose(64, 3, padding='same', activation='relu')(decoder_layer)\n","decoder_layer = Conv2DTranspose(64, 3, padding='same', activation='relu')(decoder_layer)\n","decoder_layer = Conv2DTranspose(64, 3, padding='same', activation='relu')(decoder_layer)\n","decoder_layer = Conv2DTranspose(64, 3, strides=2, padding='same', activation='relu')(decoder_layer)\n","decoder_layer = Conv2DTranspose(128, 3, padding='same', activation='relu')(decoder_layer)\n","decoder_layer = Conv2DTranspose(128, 5, padding='same', activation='relu')(decoder_layer)\n","decoder_out_layer = Conv2DTranspose(1, 5, padding='same', activation='relu')(decoder_layer)"],"metadata":{"id":"RxmaNbKCc06D"},"execution_count":null,"outputs":[]},{"cell_type":"code","source":["# Building the Decoder Model\n","decoder_model = Model(decoder_input_layer, decoder_out_layer, name='decoder_model')"],"metadata":{"id":"H0-XwcyOc06D"},"execution_count":null,"outputs":[]},{"cell_type":"code","source":["decoder_model.summary()"],"metadata":{"id":"VKt5o6ZSc06D","collapsed":true},"execution_count":null,"outputs":[]},{"cell_type":"code","source":["# Reconstructed Output from Decoder\n","reconstructed_output = decoder_model(z)\n","\n","reconstructed_model = Model(encoder_input_layer, reconstructed_output, name='reconstructed_model')\n","\n","print(f\"The type  of 'reconstructed_output' is: {type(reconstructed_output)}\")\n","print(f\"The shape of 'reconstructed_output' is: {reconstructed_output.shape}\")"],"metadata":{"id":"CBkm3tJNc06D"},"execution_count":null,"outputs":[]},{"cell_type":"markdown","source":["**VAE Loss Function**\n","\n","The loss function for a VAE is a combination of reconstruction loss and the KL divergence. The reconstruction loss ensures the decoded samples resemble the original inputs, while the KL divergence loss ensures the latent space distribution approximates a normal distribution."],"metadata":{"id":"n7UYDbKic06D"}},{"cell_type":"code","source":["# Adding the loss computation layer to the model\n","vae_loss_output = VAELossLayer()([encoder_input_layer, reconstructed_output, mu_layer, sigma_layer])\n","\n","print(f\"The type of 'vae_loss_output' is: {type(vae_loss_output)}\")\n","print(f\"The shape of 'vae_loss_output' is: {vae_loss_output.shape}\")"],"metadata":{"colab":{"base_uri":"https://localhost:8080/"},"outputId":"a37206de-1b64-4912-b20b-e327387dcddd","id":"dmrARFhpc06D"},"execution_count":null,"outputs":[{"output_type":"stream","name":"stdout","text":["The type of 'vae_loss_output' is: <class 'keras.src.backend.common.keras_tensor.KerasTensor'>\n","The shape of 'vae_loss_output' is: (None, 28, 28, 1)\n"]}]},{"cell_type":"code","source":["final_vae_model = Model(encoder_input_layer, vae_loss_output, name='vae_model')"],"metadata":{"id":"7CvQqU6Bc06E"},"execution_count":null,"outputs":[]},{"cell_type":"code","source":["# Compile the final VAE model\n","# The optimizer is set to 'adam', and the loss is already defined within the model\n","opt = keras.optimizers.Adam(learning_rate=0.0001)\n","final_vae_model.compile(optimizer=opt, loss=None)\n","\n","# Displaying the summary of the final VAE model\n","print(final_vae_model.summary())"],"metadata":{"id":"qMLR_wuic06E"},"execution_count":null,"outputs":[]},{"cell_type":"markdown","source":["\n","---\n","\n","\n","## Training new version\n","\n","\n","---\n","\n"],"metadata":{"id":"KUCRQ-UfdaLn"}},{"cell_type":"code","source":["# Training the Variational Autoencoder with Callbacks\n","\n","save_path = os.path.join(os.getcwd(), 'model_data_d{}_beta100_01'.format(latent_space_dim))\n","\n","callbacks = [\n","    EarlyStopping(monitor='val_loss', patience=15),\n","    ModelCheckpoint(save_path+'/best_model_dim_{}_fmnist.h5'.format(latent_space_dim), monitor='val_loss', save_best_only=True)\n","]\n","\n","# Fitting the model to the data # combine train & test data\n","history = final_vae_model.fit(\n","    x_for_training_VAE, None,\n","    epochs=300,\n","    batch_size=32,\n","    validation_split=0.2,\n","    callbacks=callbacks\n",")"],"metadata":{"id":"n1Y1mSVydaLo"},"execution_count":null,"outputs":[]},{"cell_type":"markdown","source":["\n","\n","\n","---\n","\n","## Visualization\n","\n","---\n","\n"],"metadata":{"id":"lBSZSvO-2QxJ"}},{"cell_type":"code","source":["from tensorflow.keras.models import load_model\n","\n","trained_model = load_model('best_model_dim_{}.h5'.format(latent_space_dim), custom_objects={\"sample_z\": sample_z, \"VAELossLayer\": VAELossLayer})"],"metadata":{"id":"vC41z9tq2QxK"},"execution_count":null,"outputs":[]},{"cell_type":"code","source":["# Encoder_mu\n","# Assume 'encoder_input' is the first input and 'z_mean' is an intermediate layer\n","encoder_input = trained_model.input\n","mu_layer = trained_model.get_layer('latent_mu')\n","mu_output = mu_layer.output\n","\n","# Recreate the encoder model\n","encoder_mu = Model(inputs=encoder_input, outputs=mu_output)\n","\n","# Encoder_sigma\n","# Assume 'encoder_input' is the first input and 'z_mean' is an intermediate layer\n","encoder_input = trained_model.input\n","sigma_layer = trained_model.get_layer('latent_sigma')\n","sigma_output = sigma_layer.output\n","\n","# Recreate the encoder model\n","encoder_sigma = Model(inputs=encoder_input, outputs=sigma_output)\n","\n","# Decoder\n","trained_decoder = trained_model.get_layer('decoder_model')"],"metadata":{"id":"7absgwWH2QxK"},"execution_count":null,"outputs":[]},{"cell_type":"code","source":["\n","index=88\n","\n","for k in range(10):\n","\n","  X_test = list_of_images[k].numpy()/255.\n","\n","  img = X_test[index]\n","\n","  encoded_mu_i = encoder_mu.predict(tf.reshape(img, (1, 28, 28, 1)))\n","  encoded_sigma_i = encoder_sigma.predict(tf.reshape(img, (1, 28, 28, 1)))\n","  epsilon_i = tf.random.normal(shape=(1, latent_space_dim))\n","  encoded_image = encoded_mu_i + tf.exp(encoded_sigma_i / 2) * epsilon_i\n","  reconstructed_img_vae = trained_decoder.predict(encoded_image)\n","\n","  plt.figure(1)\n","  plt.subplot(221)\n","  plt.imshow(X_test[index].reshape(28,28))\n","  plt.subplot(222)\n","  plt.imshow(reconstructed_img_vae.reshape(28,28))\n","\n","  plt.show()\n"],"metadata":{"id":"AJxLNk2_LiQz"},"execution_count":null,"outputs":[]},{"cell_type":"code","source":["# Example: load 900 random Fashion-MNIST images\n","# Replace this with your actual images array of shape (900, 28, 28)\n","# For demonstration, we'll use random noise images\n","images = np.random.rand(900, 28, 28)\n","\n","# Create a 30x30 grid of subplots\n","fig, axes = plt.subplots(nrows=30, ncols=30, figsize=(20, 20))\n","plt.subplots_adjust(wspace=0.1, hspace=0.1)\n","\n","count = 0\n","for i in range(30):\n","    for j in range(30):\n","        k = int(count/3)\n","        r = count%3\n","\n","        X_test = list_of_images[k].numpy()/255.\n","        img = X_test[30*r+j]\n","\n","        encoded_mu_i = encoder_mu.predict(tf.reshape(img, (1, 28, 28, 1)))\n","        encoded_sigma_i = encoder_sigma.predict(tf.reshape(img, (1, 28, 28, 1)))\n","        epsilon_i = tf.random.normal(shape=(1, latent_space_dim))\n","        encoded_image = encoded_mu_i + tf.exp(encoded_sigma_i / 2) * epsilon_i\n","        reconstructed_img_vae = trained_decoder.predict(encoded_image)\n","\n","        ax = axes[i, j]\n","        ax.imshow(reconstructed_img_vae.reshape(28, 28), cmap='gray')\n","        ax.axis('off')\n","    count+=1\n","\n","plt.tight_layout()\n","plt.show()\n"],"metadata":{"id":"PM6Y-cQOR_aw"},"execution_count":null,"outputs":[]}]}