Preprocessing and Training a CNN on the Fashion MNIST Dataset

# Import necessary libraries
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
from sklearn.model_selection import train_test_split
from sklearn.metrics import confusion_matrix
import tensorflow as tf
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Conv2D, MaxPooling2D, Flatten, Dense, LSTM

# a. Get the data
# load_data() yields a (train, test) pair of (images, labels) tuples; each
# split is kept in a dict so images and labels travel together.
(train_images, train_labels), (test_images, test_labels) = (
    tf.keras.datasets.fashion_mnist.load_data()
)
train_yagnam = {'images': train_images, 'labels': train_labels}
test_yagnam = {'images': test_images, 'labels': test_labels}

# b. Initial Exploration
# 1. Display the size of the training and testing dataset
print("Size of the training dataset:", len(train_yagnam['images']))
print("Size of the testing dataset:", len(test_yagnam['images']))

# 2. Display the image resolution (dimension) of the input images
# shape[1:] drops the leading per-sample axis and keeps the per-image dims.
image_resolution = train_yagnam['images'].shape[1:]
print("Image Resolution (Dimension):", image_resolution)

# 3. Display the largest pixel value in the dataset using numpy.amax()
# NOTE: only the training images are inspected here.
largest_pixel_value = np.amax(train_yagnam['images'])
print("Largest Pixel Value in the Dataset:", largest_pixel_value)

# c. Data Pre-processing
# 1. Normalize pixel values to a range between 0-1
# Dividing by 255.0 assumes 8-bit pixel data whose maximum is 255 -- confirm
# against the "largest pixel value" printed during exploration.
train_yagnam['images'] = train_yagnam['images'] / 255.0
test_yagnam['images'] = test_yagnam['images'] / 255.0

# 2. One-hot encode the labels
train_yagnam['labels'] = tf.keras.utils.to_categorical(train_yagnam['labels'])
test_yagnam['labels'] = tf.keras.utils.to_categorical(test_yagnam['labels'])

# 3. Display the shape of train_yagnam['labels'] and test_yagnam['labels']
print("Shape of train_yagnam['labels']:", train_yagnam['labels'].shape)
print("Shape of test_yagnam['labels']:", test_yagnam['labels'].shape)

# Number of possible labels (width of the one-hot encoding)
num_possible_labels = train_yagnam['labels'].shape[1]
print("Number of Possible Labels in the Dataset:", num_possible_labels)


# d. Visualization
# 1. Create a function to display an image with its true label
def display_image(image, true_label, ax=None):
    """Show a single image titled with its true label.

    Args:
        image: 2-D array of pixel values, rendered with a gray colormap.
        true_label: Value shown in the title after ``True Label:``.
        ax: Optional matplotlib Axes to draw on. When omitted, the image is
            drawn on the current pyplot axes and shown immediately. When
            given, the image is drawn on ``ax`` only and the caller is
            responsible for calling ``plt.show()``.
    """
    title = f'True Label: {true_label}'
    if ax is None:
        # Stand-alone usage: draw via the pyplot state machine and display.
        plt.imshow(image, cmap='gray')
        plt.title(title)
        plt.axis('off')
        plt.show()
        return
    # Grid usage: draw on the supplied cell and leave showing to the caller.
    ax.imshow(image, cmap='gray')
    ax.set_title(title)
    ax.axis('off')


# 2. Plot the first 12 data samples in the training dataset
fig, axes = plt.subplots(nrows=4, ncols=3, figsize=(8, 8))
# axes.flat walks the 4x3 grid row by row, i.e. the same cell order as
# axes[i // 3, i % 3]. Each sample is drawn into its own cell rather than
# through plt.imshow()/plt.show(), which ignored the grid on every iteration.
for i, ax in enumerate(axes.flat):
    display_image(
        train_yagnam['images'][i],
        true_label=np.argmax(train_yagnam['labels'][i]),  # undo one-hot
        ax=ax,
    )
plt.tight_layout()
plt.show()

# e. Training Data Preparation
# 1. Split the training dataset using Sklearn's train_test_split
# test_size=0.2 holds out 20% of the training data for validation;
# random_state=19 fixes the shuffle so the split is repeatable.
x_train_yagnam, x_val_yagnam, y_train_yagnam, y_val_yagnam = train_test_split(
    train_yagnam['images'],
    train_yagnam['labels'],
    test_size=0.2,
    random_state=19,
)

# f. Build, Train, and Validate CNN Model
# Assuming your original image shape is (28, 28)
original_image_shape = (28, 28)
height, width = original_image_shape

# Reshape the input data to add a channel dimension:
# (N, H, W) -> (N, H, W, 1); -1 lets numpy infer the sample count.
x_train_yagnam = x_train_yagnam.reshape(-1, height, width, 1)
x_val_yagnam = x_val_yagnam.reshape(-1, height, width, 1)
test_yagnam['images'] = test_yagnam['images'].reshape(-1, height, width, 1)

# Assuming your labels are already one-hot encoded
num_possible_labels = y_train_yagnam.shape[1]

Your preview ends here