from google.colab import drive
drive.mount('/content/drive')

Drive already mounted at /content/drive; to attempt to forcibly remount, call drive.mount("/content/drive", force_remount=True).

import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import os
import zipfile

# For Data Visualization
import cv2
import seaborn as sns

# For Model Building
import tensorflow as tf
import keras
from tensorflow.keras.models import Sequential, Model                                                                       # Sequential API for sequential model
from tensorflow.keras.layers import Dense, Dropout, Flatten                                                                 # Importing different layers
from tensorflow.keras.layers import Conv2D, MaxPooling2D, BatchNormalization, Activation, Input, LeakyReLU, Activation
from tensorflow.keras import backend                                                                                        # This helps to clear memory to prevent overflow
from tensorflow.keras.utils import to_categorical                                                                           # To perform one-hot encoding
from tensorflow.keras.optimizers import RMSprop, Adam, SGD                                                                  # Optimizers for optimizing the model
from tensorflow.keras.callbacks import EarlyStopping                                                                        # Regularization method to prevent the overfitting - stops the model if accuracy doesnt improve after a defined number of epoch
from tensorflow.keras.callbacks import ModelCheckpoint                                                                      # Save the best model
from tensorflow.keras import losses, optimizers
from tensorflow.keras.preprocessing.image import load_img
from google.colab.patches import cv2_imshow

import random

# Unzip the data - We only need to do this once, comment this out if it has already been done

# Storing the path of the data file from the Google drive
path = '/content/drive/MyDrive/MIT - Data Sciences/Colab Notebooks/Week_Six_-_Deep_Learning/Guided_Project_Food_Image_Classification/Food_Data.zip'

# The data is provided as a zip file so we need to extract the files from the zip file
with zipfile.ZipFile(path, 'r') as zip_ref:
    zip_ref.extractall()                      # Places data in the Content folder

# Storing the training path in a variable named DATADIR, and storing the unique categories/labels in a list

DATADIR = "/content/Food_Data/Training"                                        # Path of training data after unzipping
CATEGORIES = ["Bread", "Soup", "Vegetable-Fruit"]                              # Storing all the categories in 'CATEGORIES' variable
IMG_SIZE = 150                                                                 # Defining the size of the image to 150

# Here we will be using a user defined function create_training_data() to extract the images from the directory
training_data = []

# Storing all the training images
def create_training_data():
    for category in CATEGORIES:                                                # Looping over each category from the CATEGORIES list
        path = os.path.join(DATADIR, category)                                 # Joining images with labels
        class_num = category

        for img in os.listdir(path):
            img_array = cv2.imread(os.path.join(path, img))                    # Reading the data

            new_array = cv2.resize(img_array, (IMG_SIZE, IMG_SIZE))            # Resizing the images

            training_data.append([new_array, class_num])                       # Appending both the images and labels

create_training_data()

DATADIR_test = "/content/Food_Data/Testing"                                    # Path of training data after unzipping
CATEGORIES =  ["Bread", "Soup", "Vegetable-Fruit"]                             # Storing all the categories in categories variable
IMG_SIZE = 150                                                                 # Defining the size of the image to 150

# Here we will be using a user defined function create_testing_data() to extract the images from the directory
testing_data = []

# Storing all the testing images
def create_testing_data():
    for category in CATEGORIES:                                                # Looping over each category from the CATEGORIES list
        path = os.path.join(DATADIR_test, category)                            # Joining images with labels
        class_num = category

        for img in os.listdir(path):
            img_array = cv2.imread(os.path.join(path, img))                    # Reading the data

            new_array = cv2.resize(img_array, (IMG_SIZE, IMG_SIZE))            # Resizing the images

            testing_data.append([new_array, class_num])                        # Appending both the images and labels

create_testing_data()

bread_imgs = [fn for fn in os.listdir(f'{DATADIR}/{CATEGORIES[0]}') ]
select_bread = np.random.choice(bread_imgs, 9, replace = False)               # replace = True would allow the same image to be part of the random pool again

fig = plt.figure(figsize = (10, 10))

for i in range(9):
    ax = fig.add_subplot(4, 3, i + 1)

    fp = f'{DATADIR}/{CATEGORIES[0]}/{select_bread[i]}'

    fn = load_img(fp, target_size = (150, 150))

    plt.imshow(fn, cmap = 'Greys_r')

    plt.axis('off')

plt.show()

soup_imgs = [fn for fn in os.listdir(f'{DATADIR}/{CATEGORIES[1]}') ]
select_soup = np.random.choice(soup_imgs, 9, replace = False)

fig = plt.figure(figsize = (10, 10))

for i in range(9):
    ax = fig.add_subplot(4, 3, i + 1)

    fp = f'{DATADIR}/{CATEGORIES[1]}/{select_soup[i]}'

    fn = load_img(fp, target_size = (150, 150))

    plt.imshow(fn, cmap = 'Greys_r')

    plt.axis('off')

plt.show()

vegetable_fruit_imgs = [fn for fn in os.listdir(f'{DATADIR}/{CATEGORIES[2]}') ]
select_vegetable_fruit = np.random.choice(vegetable_fruit_imgs, 9, replace = False)

fig = plt.figure(figsize = (10, 10))

for i in range(9):
    ax = fig.add_subplot(4, 3, i + 1)

    fp = f'{DATADIR}/{CATEGORIES[2]}/{select_vegetable_fruit[i]}'

    fn = load_img(fp, target_size = (150, 150))

    plt.imshow(fn, cmap = 'Greys_r')

    plt.axis('off')

plt.show()

# Creating two different lists to store the Numpy arrays and the corresponding labels
X_train = []
y_train = []

np.random.shuffle(training_data)                                               # Shuffling data to reduce variance and making sure that model remains general and overfit less
for features, label in training_data:                                          # Iterating over the training data which is generated from the create_training_data() function
    X_train.append(features)                                                   # Appending images into X_train
    y_train.append(label)                                                      # Appending labels into y_train

# Creating two different lists to store the Numpy arrays and the corresponding labels
X_test = []
y_test = []

np.random.shuffle(testing_data)                                                # Shuffling data to reduce variance and making sure that model remains general and overfit less
for features, label in testing_data:                                           # Iterating over the training data which is generated from the create_testing_data() function
    X_test.append(features)                                                    # Appending images into X_test
    y_test.append(label)                                                       # Appending labels into y_test

# Converting the pixel values into Numpy array
X_train = np.array(X_train)
X_test = np.array(X_test)
X_train.shape

(3203, 150, 150, 3)

# Converting the lists into DataFrames
y_train = pd.DataFrame(y_train, columns = ["Label"], dtype = object)
y_test = pd.DataFrame(y_test, columns = ["Label"], dtype = object)

# Printing the value counts of target variable
count = y_train.Label.value_counts()
print(count)

print('*'*10)

count = y_train.Label.value_counts(normalize = True)
print(count)

Label
Soup               1500
Bread               994
Vegetable-Fruit     709
Name: count, dtype: int64
**********
Label
Soup               0.468311
Bread              0.310334
Vegetable-Fruit    0.221355
Name: proportion, dtype: float64

# Normalizing the image data
X_train = X_train/255.0

X_test = X_test/255.0

y_train_encoded = [ ]

for label_name in y_train["Label"]:
    if(label_name == 'Bread'):
        y_train_encoded.append(0)

    if(label_name == 'Soup'):
        y_train_encoded.append(1)

    if(label_name == 'Vegetable-Fruit'):
        y_train_encoded.append(2)

y_train_encoded = to_categorical(y_train_encoded, 3)                           # Convert to one hot encoded
y_train_encoded

array([[1., 0., 0.],
       [0., 0., 1.],
       [0., 1., 0.],
       ...,
       [0., 1., 0.],
       [0., 1., 0.],
       [0., 1., 0.]])

y_test_encoded = [ ]

for label_name in y_test["Label"]:
    if(label_name == 'Bread'):
        y_test_encoded.append(0)

    if(label_name == 'Soup'):
        y_test_encoded.append(1)

    if(label_name == 'Vegetable-Fruit'):
        y_test_encoded.append(2)

y_test_encoded = to_categorical(y_test_encoded, 3)
y_test_encoded

array([[1., 0., 0.],
       [1., 0., 0.],
       [0., 0., 1.],
       ...,
       [0., 1., 0.],
       [1., 0., 0.],
       [1., 0., 0.]])

backend.clear_session()                                                        # Clear the session backend for memory conservation

# Fixing the seed for random number generators so that we can ensure we receive the same output everytime
seed = 42

np.random.seed(seed)
random.seed(seed)
tf.random.set_seed(seed)

# Intializing a sequential model
model = Sequential()

# Adding first conv layer with 64 filters and kernel size 3x3, padding 'same' provides the output size same as the input size
# The input_shape denotes input image dimension
model.add(                                                                     # See OneNote for complete code breakdown
          Conv2D(                                                              # Adds a Convolutional 2D (Conv2D) layer to the model.
                  64,                                                          # Specifies the number of filters (or kernels) in the Conv2D layer
                  (3, 3),                                                      # Defines the kernel size or filter size
                  activation = 'relu',                                         # Applies the ReLU (Rectified Linear Unit) activation function to the output of the Conv2D layer
                  padding = "same",                                            # Specifies the padding strategy. "Same" padding means that the input image is padded with zeros such that the output image has the same dimensions as the input (150x150)
                  input_shape = (150, 150, 3)                                  # Defines the input shape to the Conv2D layer
                  )
          )

# Adding max pooling to reduce the size of output of first conv layer
model.add(                                                                     # See OneNote for complete code breakdown
          MaxPooling2D(                                                        # MaxPooling helps reduce the spatial dimensions (height and width) of the feature maps, reduces computational complexity and helps avoid overfitting
                      (2, 2),                                                  # Specifies the pool size, a 2x2 window will slide over the input feature map
                      padding = 'same'                                         # Ensures that the output feature map retains the same dimensions as the input feature map
                      )
          )

# Adding second conv layer with 32 filters and kernel size 3x3, padding 'same' followed by a Maxpooling2D layer
model.add(Conv2D(32, (3, 3), activation = 'relu', padding = "same"))
model.add(MaxPooling2D((2, 2), padding = 'same'))

# Add third conv layer with 32 filters and kernel size 3x3, padding 'same' followed by a Maxpooling2D layer
model.add(Conv2D(32, (3, 3), activation='relu', padding="same"))
model.add(MaxPooling2D((2, 2), padding = 'same'))

# Flattening the output of the conv layer after max pooling to make it ready for creating dense connections
model.add(Flatten())

# Adding a fully connected dense layer with 100 neurons
model.add(Dense(100, activation = 'relu'))

# Adding the output layer with 3 neurons and activation functions as softmax since this is a multi-class classification problem
model.add(Dense(3, activation = 'softmax'))

# Using SGD Optimizer
opt = SGD(learning_rate = 0.01, momentum = 0.9)                                # Instatiate an optimizer

# Compiling the model
model.compile(optimizer = opt, loss = 'categorical_crossentropy', metrics = ['accuracy'])

# Generating the summary of the model
model.summary()

/usr/local/lib/python3.10/dist-packages/keras/src/layers/convolutional/base_conv.py:107: UserWarning: Do not pass an `input_shape`/`input_dim` argument to a layer. When using Sequential models, prefer using an `Input(shape)` object as the first layer in the model instead.
  super().__init__(activity_regularizer=activity_regularizer, **kwargs)

Model: "sequential"

┏━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━┓
┃ Layer (type)                         ┃ Output Shape                ┃         Param # ┃
┡━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━┩
│ conv2d (Conv2D)                      │ (None, 150, 150, 64)        │           1,792 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ max_pooling2d (MaxPooling2D)         │ (None, 75, 75, 64)          │               0 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ conv2d_1 (Conv2D)                    │ (None, 75, 75, 32)          │          18,464 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ max_pooling2d_1 (MaxPooling2D)       │ (None, 38, 38, 32)          │               0 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ conv2d_2 (Conv2D)                    │ (None, 38, 38, 32)          │           9,248 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ max_pooling2d_2 (MaxPooling2D)       │ (None, 19, 19, 32)          │               0 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ flatten (Flatten)                    │ (None, 11552)               │               0 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ dense (Dense)                        │ (None, 100)                 │       1,155,300 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ dense_1 (Dense)                      │ (None, 3)                   │             303 │
└──────────────────────────────────────┴─────────────────────────────┴─────────────────┘

 Total params: 1,185,107 (4.52 MB)

 Trainable params: 1,185,107 (4.52 MB)

 Non-trainable params: 0 (0.00 B)

# The following lines of code saves the best model's parameters if training accuracy goes down on further training
es = EarlyStopping(
                  monitor = 'val_loss',                                        # Specifies what metric to monitor during training
                  mode = 'min',                                                # Defines whether the EarlyStopping should stop when the monitored metric is minimized or maximized
                  verbose = 1,                                                 # Controls the level of output in the training logs
                  patience = 5                                                 # Defines how many epochs to wait after the last improvement before stopping
                  )
# mc = ModelCheckpoint('best_model.h5', monitor = 'val_accuracy', mode = 'max', verbose = 1, save_best_only = True)     # Original code contains an error

mc = ModelCheckpoint(                                                          # Corrected code
                    'best_model.keras',
                    monitor = 'val_accuracy',
                    mode = 'max',
                    verbose = 1,
                    save_best_only = True)

# Fitting the model with 30 epochs and validation_split as 10%
history = model.fit(
                    X_train,
                    y_train_encoded,
                    epochs = 60,
                    batch_size= 32,
                    validation_split = 0.10,
                    callbacks = [es, mc]
                    )

Epoch 1/60
91/91 ━━━━━━━━━━━━━━━━━━━━ 0s 39ms/step - accuracy: 0.4704 - loss: 1.0586
Epoch 1: val_accuracy improved from -inf to 0.51090, saving model to best_model.keras
91/91 ━━━━━━━━━━━━━━━━━━━━ 11s 61ms/step - accuracy: 0.4706 - loss: 1.0585 - val_accuracy: 0.5109 - val_loss: 1.0930
Epoch 2/60
89/91 ━━━━━━━━━━━━━━━━━━━━ 0s 24ms/step - accuracy: 0.4852 - loss: 1.0538
Epoch 2: val_accuracy improved from 0.51090 to 0.62617, saving model to best_model.keras
91/91 ━━━━━━━━━━━━━━━━━━━━ 2s 26ms/step - accuracy: 0.4857 - loss: 1.0525 - val_accuracy: 0.6262 - val_loss: 0.8103
Epoch 3/60
89/91 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.5458 - loss: 0.9392
Epoch 3: val_accuracy did not improve from 0.62617
91/91 ━━━━━━━━━━━━━━━━━━━━ 3s 26ms/step - accuracy: 0.5459 - loss: 0.9387 - val_accuracy: 0.5234 - val_loss: 1.0298
Epoch 4/60
91/91 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.5582 - loss: 0.9195
Epoch 4: val_accuracy did not improve from 0.62617
91/91 ━━━━━━━━━━━━━━━━━━━━ 3s 27ms/step - accuracy: 0.5582 - loss: 0.9193 - val_accuracy: 0.5826 - val_loss: 0.8939
Epoch 5/60
91/91 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.5939 - loss: 0.8284
Epoch 5: val_accuracy did not improve from 0.62617
91/91 ━━━━━━━━━━━━━━━━━━━━ 3s 28ms/step - accuracy: 0.5939 - loss: 0.8283 - val_accuracy: 0.5888 - val_loss: 0.8565
Epoch 6/60
91/91 ━━━━━━━━━━━━━━━━━━━━ 0s 24ms/step - accuracy: 0.6086 - loss: 0.7836
Epoch 6: val_accuracy improved from 0.62617 to 0.63240, saving model to best_model.keras
91/91 ━━━━━━━━━━━━━━━━━━━━ 2s 27ms/step - accuracy: 0.6087 - loss: 0.7834 - val_accuracy: 0.6324 - val_loss: 0.7492
Epoch 7/60
91/91 ━━━━━━━━━━━━━━━━━━━━ 0s 24ms/step - accuracy: 0.6366 - loss: 0.7300
Epoch 7: val_accuracy did not improve from 0.63240
91/91 ━━━━━━━━━━━━━━━━━━━━ 2s 26ms/step - accuracy: 0.6368 - loss: 0.7298 - val_accuracy: 0.6168 - val_loss: 0.7717
Epoch 8/60
89/91 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.6642 - loss: 0.6997
Epoch 8: val_accuracy improved from 0.63240 to 0.63863, saving model to best_model.keras
91/91 ━━━━━━━━━━━━━━━━━━━━ 3s 27ms/step - accuracy: 0.6647 - loss: 0.6988 - val_accuracy: 0.6386 - val_loss: 0.7280
Epoch 9/60
89/91 ━━━━━━━━━━━━━━━━━━━━ 0s 24ms/step - accuracy: 0.6887 - loss: 0.6560
Epoch 9: val_accuracy improved from 0.63863 to 0.65732, saving model to best_model.keras
91/91 ━━━━━━━━━━━━━━━━━━━━ 2s 26ms/step - accuracy: 0.6894 - loss: 0.6550 - val_accuracy: 0.6573 - val_loss: 0.7174
Epoch 10/60
89/91 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.7225 - loss: 0.5960
Epoch 10: val_accuracy did not improve from 0.65732
91/91 ━━━━━━━━━━━━━━━━━━━━ 3s 28ms/step - accuracy: 0.7227 - loss: 0.5956 - val_accuracy: 0.6542 - val_loss: 0.7569
Epoch 11/60
88/91 ━━━━━━━━━━━━━━━━━━━━ 0s 25ms/step - accuracy: 0.7229 - loss: 0.5710
Epoch 11: val_accuracy improved from 0.65732 to 0.68536, saving model to best_model.keras
91/91 ━━━━━━━━━━━━━━━━━━━━ 5s 26ms/step - accuracy: 0.7239 - loss: 0.5698 - val_accuracy: 0.6854 - val_loss: 0.9102
Epoch 12/60
90/91 ━━━━━━━━━━━━━━━━━━━━ 0s 24ms/step - accuracy: 0.7845 - loss: 0.4861
Epoch 12: val_accuracy did not improve from 0.68536
91/91 ━━━━━━━━━━━━━━━━━━━━ 2s 25ms/step - accuracy: 0.7848 - loss: 0.4859 - val_accuracy: 0.6449 - val_loss: 1.0035
Epoch 13/60
89/91 ━━━━━━━━━━━━━━━━━━━━ 0s 24ms/step - accuracy: 0.8136 - loss: 0.4587
Epoch 13: val_accuracy did not improve from 0.68536
91/91 ━━━━━━━━━━━━━━━━━━━━ 2s 25ms/step - accuracy: 0.8143 - loss: 0.4573 - val_accuracy: 0.6698 - val_loss: 0.8364
Epoch 14/60
89/91 ━━━━━━━━━━━━━━━━━━━━ 0s 26ms/step - accuracy: 0.8688 - loss: 0.3310
Epoch 14: val_accuracy did not improve from 0.68536
91/91 ━━━━━━━━━━━━━━━━━━━━ 3s 28ms/step - accuracy: 0.8697 - loss: 0.3291 - val_accuracy: 0.6604 - val_loss: 0.9961
Epoch 14: early stopping

# Plotting the training and validation accuracies for each epoch

plt.plot(history.history['accuracy'])
plt.plot(history.history['val_accuracy'])
plt.title('model accuracy')
plt.ylabel('accuracy')
plt.xlabel('epoch')
plt.legend(['train', 'validation'], loc='upper left')
plt.show()

model.evaluate(X_test, (y_test_encoded))

35/35 ━━━━━━━━━━━━━━━━━━━━ 1s 27ms/step - accuracy: 0.6448 - loss: 1.1261

[1.085956335067749, 0.660877525806427]

from sklearn.metrics import classification_report
from sklearn.metrics import confusion_matrix

pred = model.predict(X_test)
pred = np.argmax(pred, axis = 1)
y_true = np.argmax(y_test_encoded, axis = 1)

# Printing the classification report
print(classification_report(y_true, pred))

# Plotting the heatmap using confusion matrix
cm = confusion_matrix(y_true, pred)
plt.figure(figsize = (8, 5))
sns.heatmap(cm, annot = True,  fmt = '.0f', xticklabels = ['Bread', 'Soup', 'Vegetable-Fruit'], yticklabels=['Bread', 'Soup', 'Vegetable-Fruit'])
plt.ylabel('Actual')
plt.xlabel('Predicted')
plt.show()

35/35 ━━━━━━━━━━━━━━━━━━━━ 1s 15ms/step
              precision    recall  f1-score   support

           0       0.64      0.43      0.51       362
           1       0.73      0.75      0.74       500
           2       0.57      0.83      0.67       232

    accuracy                           0.66      1094
   macro avg       0.65      0.67      0.64      1094
weighted avg       0.67      0.66      0.65      1094

from tensorflow.keras import backend
backend.clear_session()

# Fixing the seed for random number generators so that we can ensure we receive the same output everytime
np.random.seed(42)
import random
random.seed(42)
tf.random.set_seed(42)

# Initializing a sequential model
model_2 = Sequential()

# Adding first conv layer with 256 filters and kernel size 5x5, with ReLU activation and padding 'same' provides the output size same as the input size
# The input_shape denotes input image dimension
model_2.add(Conv2D(filters = 256, kernel_size = (5, 5), padding = 'Same', activation = 'relu', input_shape = (150, 150, 3)))

# Adding max pooling to reduce the size of output of first conv layer
model_2.add(MaxPooling2D(pool_size = (2, 2), strides = (2, 2)))

#  Adding dropout to randomly switch off 25% neurons to reduce overfitting
model_2.add(Dropout(0.25))

# Adding second conv layer with 128 filters and with kernel size 5x5 and ReLu activation function
model_2.add(Conv2D(filters = 128, kernel_size = (5, 5), padding = 'Same', activation = 'relu'))

# Adding max pooling to reduce the size of output of first conv layer
model_2.add(MaxPooling2D(pool_size = (2, 2), strides = (2, 2)))

#  Adding dropout to randomly switch off 25% neurons to reduce overfitting
model_2.add(Dropout(0.25))

# Adding third conv layer with 64 filters and with kernel size 3x3 and ReLu activation function
model_2.add(Conv2D(filters = 64, kernel_size = (3, 3), padding = 'Same', activation = 'relu'))

# Adding max pooling to reduce the size of output of first conv layer
model_2.add(MaxPooling2D(pool_size = (2, 2), strides = (2, 2)))

#  Adding dropout to randomly switch off 25% neurons to reduce overfitting
model_2.add(Dropout(0.25))

# Adding fourth conv layer with 32 filters and with kernel size 3x3 and ReLu activation function
model_2.add(Conv2D(filters = 32, kernel_size = (3, 3), padding = 'Same', activation = 'relu'))

# Adding max pooling to reduce the size of output of first conv layer
model_2.add(MaxPooling2D(pool_size = (2, 2), strides = (2, 2)))

#  Adding dropout to randomly switch off 25% neurons to reduce overfitting
model_2.add(Dropout(0.25))

# Flattening the 3-d output of the conv layer after max pooling to make it ready for creating dense connections
model_2.add(Flatten())

# Adding first fully connected dense layer with 64 neurons
model_2.add(Dense(64, activation = "relu"))

# Adding second fully connected dense layer with 32 neurons
model_2.add(Dense(32, activation = "relu"))

# Adding the output layer with 3 neurons and activation functions as softmax since this is a multi-class classification problem
model_2.add(Dense(3, activation = "softmax"))

# Using Adam Optimizer
optimizer = Adam(learning_rate = 0.001)

# Compile the model
model_2.compile(optimizer = optimizer , loss = "categorical_crossentropy", metrics = ["accuracy"])

/usr/local/lib/python3.10/dist-packages/keras/src/layers/convolutional/base_conv.py:107: UserWarning: Do not pass an `input_shape`/`input_dim` argument to a layer. When using Sequential models, prefer using an `Input(shape)` object as the first layer in the model instead.
  super().__init__(activity_regularizer=activity_regularizer, **kwargs)

model_2.summary()

Model: "sequential"

┏━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━━━━━━━━━━━━━┳━━━━━━━━━━━━━━━━━┓
┃ Layer (type)                         ┃ Output Shape                ┃         Param # ┃
┡━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━━━━━━━━━━━━━╇━━━━━━━━━━━━━━━━━┩
│ conv2d (Conv2D)                      │ (None, 150, 150, 256)       │          19,456 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ max_pooling2d (MaxPooling2D)         │ (None, 75, 75, 256)         │               0 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ dropout (Dropout)                    │ (None, 75, 75, 256)         │               0 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ conv2d_1 (Conv2D)                    │ (None, 75, 75, 128)         │         819,328 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ max_pooling2d_1 (MaxPooling2D)       │ (None, 37, 37, 128)         │               0 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ dropout_1 (Dropout)                  │ (None, 37, 37, 128)         │               0 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ conv2d_2 (Conv2D)                    │ (None, 37, 37, 64)          │          73,792 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ max_pooling2d_2 (MaxPooling2D)       │ (None, 18, 18, 64)          │               0 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ dropout_2 (Dropout)                  │ (None, 18, 18, 64)          │               0 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ conv2d_3 (Conv2D)                    │ (None, 18, 18, 32)          │          18,464 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ max_pooling2d_3 (MaxPooling2D)       │ (None, 9, 9, 32)            │               0 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ dropout_3 (Dropout)                  │ (None, 9, 9, 32)            │               0 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ flatten (Flatten)                    │ (None, 2592)                │               0 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ dense (Dense)                        │ (None, 64)                  │         165,952 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ dense_1 (Dense)                      │ (None, 32)                  │           2,080 │
├──────────────────────────────────────┼─────────────────────────────┼─────────────────┤
│ dense_2 (Dense)                      │ (None, 3)                   │              99 │
└──────────────────────────────────────┴─────────────────────────────┴─────────────────┘

 Total params: 1,099,171 (4.19 MB)

 Trainable params: 1,099,171 (4.19 MB)

 Non-trainable params: 0 (0.00 B)

es = EarlyStopping(monitor = 'val_loss', mode = 'min', verbose = 1, patience = 5)
mc = ModelCheckpoint('best_model.keras', monitor = 'val_accuracy', mode = 'max', verbose = 1, save_best_only = True)

'''# There is an error with this code
history=model_2.fit(X_train,
          y_train_encoded,
          epochs = 60,
          batch_size = 32, validation_split = 0.10, use_multiprocessing = True)
'''

history=model_2.fit(
                    X_train,
                    y_train_encoded,
                    epochs = 60,
                    batch_size = 32,
                    validation_split = 0.10,
                    callbacks = [es, mc]
                    )

Epoch 1/60
91/91 ━━━━━━━━━━━━━━━━━━━━ 0s 245ms/step - accuracy: 0.4347 - loss: 1.0847
Epoch 1: val_accuracy improved from -inf to 0.51090, saving model to best_model.keras
91/91 ━━━━━━━━━━━━━━━━━━━━ 49s 323ms/step - accuracy: 0.4349 - loss: 1.0845 - val_accuracy: 0.5109 - val_loss: 1.0238
Epoch 2/60
90/91 ━━━━━━━━━━━━━━━━━━━━ 0s 156ms/step - accuracy: 0.4736 - loss: 1.0476
Epoch 2: val_accuracy improved from 0.51090 to 0.60436, saving model to best_model.keras
91/91 ━━━━━━━━━━━━━━━━━━━━ 49s 160ms/step - accuracy: 0.4735 - loss: 1.0474 - val_accuracy: 0.6044 - val_loss: 0.9109
Epoch 3/60
90/91 ━━━━━━━━━━━━━━━━━━━━ 0s 158ms/step - accuracy: 0.5630 - loss: 0.9060
Epoch 3: val_accuracy did not improve from 0.60436
91/91 ━━━━━━━━━━━━━━━━━━━━ 21s 160ms/step - accuracy: 0.5630 - loss: 0.9056 - val_accuracy: 0.6012 - val_loss: 0.8297
Epoch 4/60
90/91 ━━━━━━━━━━━━━━━━━━━━ 0s 156ms/step - accuracy: 0.5976 - loss: 0.8418
Epoch 4: val_accuracy improved from 0.60436 to 0.62305, saving model to best_model.keras
91/91 ━━━━━━━━━━━━━━━━━━━━ 20s 160ms/step - accuracy: 0.5974 - loss: 0.8417 - val_accuracy: 0.6231 - val_loss: 0.7941
Epoch 5/60
90/91 ━━━━━━━━━━━━━━━━━━━━ 0s 155ms/step - accuracy: 0.6128 - loss: 0.7874
Epoch 5: val_accuracy improved from 0.62305 to 0.64798, saving model to best_model.keras
91/91 ━━━━━━━━━━━━━━━━━━━━ 20s 158ms/step - accuracy: 0.6128 - loss: 0.7870 - val_accuracy: 0.6480 - val_loss: 0.7319
Epoch 6/60
90/91 ━━━━━━━━━━━━━━━━━━━━ 0s 156ms/step - accuracy: 0.6155 - loss: 0.7641
Epoch 6: val_accuracy improved from 0.64798 to 0.65421, saving model to best_model.keras
91/91 ━━━━━━━━━━━━━━━━━━━━ 21s 162ms/step - accuracy: 0.6155 - loss: 0.7639 - val_accuracy: 0.6542 - val_loss: 0.7065
Epoch 7/60
90/91 ━━━━━━━━━━━━━━━━━━━━ 0s 156ms/step - accuracy: 0.6332 - loss: 0.7349
Epoch 7: val_accuracy improved from 0.65421 to 0.67290, saving model to best_model.keras
91/91 ━━━━━━━━━━━━━━━━━━━━ 15s 164ms/step - accuracy: 0.6330 - loss: 0.7349 - val_accuracy: 0.6729 - val_loss: 0.6936
Epoch 8/60
90/91 ━━━━━━━━━━━━━━━━━━━━ 0s 154ms/step - accuracy: 0.6401 - loss: 0.7189
Epoch 8: val_accuracy did not improve from 0.67290
91/91 ━━━━━━━━━━━━━━━━━━━━ 20s 157ms/step - accuracy: 0.6403 - loss: 0.7185 - val_accuracy: 0.6604 - val_loss: 0.6934
Epoch 9/60
90/91 ━━━━━━━━━━━━━━━━━━━━ 0s 158ms/step - accuracy: 0.6984 - loss: 0.6560
Epoch 9: val_accuracy improved from 0.67290 to 0.68224, saving model to best_model.keras
91/91 ━━━━━━━━━━━━━━━━━━━━ 15s 161ms/step - accuracy: 0.6983 - loss: 0.6558 - val_accuracy: 0.6822 - val_loss: 0.6562
Epoch 10/60
90/91 ━━━━━━━━━━━━━━━━━━━━ 0s 155ms/step - accuracy: 0.7311 - loss: 0.5999
Epoch 10: val_accuracy improved from 0.68224 to 0.68536, saving model to best_model.keras
91/91 ━━━━━━━━━━━━━━━━━━━━ 14s 158ms/step - accuracy: 0.7312 - loss: 0.5997 - val_accuracy: 0.6854 - val_loss: 0.6506
Epoch 11/60
90/91 ━━━━━━━━━━━━━━━━━━━━ 0s 154ms/step - accuracy: 0.7646 - loss: 0.5418
Epoch 11: val_accuracy improved from 0.68536 to 0.71340, saving model to best_model.keras
91/91 ━━━━━━━━━━━━━━━━━━━━ 21s 158ms/step - accuracy: 0.7647 - loss: 0.5414 - val_accuracy: 0.7134 - val_loss: 0.6155
Epoch 12/60
90/91 ━━━━━━━━━━━━━━━━━━━━ 0s 156ms/step - accuracy: 0.7906 - loss: 0.4950
Epoch 12: val_accuracy did not improve from 0.71340
91/91 ━━━━━━━━━━━━━━━━━━━━ 20s 158ms/step - accuracy: 0.7907 - loss: 0.4949 - val_accuracy: 0.7040 - val_loss: 0.6468
Epoch 13/60
90/91 ━━━━━━━━━━━━━━━━━━━━ 0s 156ms/step - accuracy: 0.8059 - loss: 0.4513
Epoch 13: val_accuracy improved from 0.71340 to 0.72897, saving model to best_model.keras
91/91 ━━━━━━━━━━━━━━━━━━━━ 21s 164ms/step - accuracy: 0.8061 - loss: 0.4510 - val_accuracy: 0.7290 - val_loss: 0.6031
Epoch 14/60
90/91 ━━━━━━━━━━━━━━━━━━━━ 0s 156ms/step - accuracy: 0.8268 - loss: 0.4075
Epoch 14: val_accuracy did not improve from 0.72897
91/91 ━━━━━━━━━━━━━━━━━━━━ 20s 161ms/step - accuracy: 0.8264 - loss: 0.4082 - val_accuracy: 0.7072 - val_loss: 0.6395
Epoch 15/60
90/91 ━━━━━━━━━━━━━━━━━━━━ 0s 155ms/step - accuracy: 0.8339 - loss: 0.3977
Epoch 15: val_accuracy did not improve from 0.72897
91/91 ━━━━━━━━━━━━━━━━━━━━ 20s 158ms/step - accuracy: 0.8339 - loss: 0.3978 - val_accuracy: 0.6573 - val_loss: 0.8049
Epoch 16/60
90/91 ━━━━━━━━━━━━━━━━━━━━ 0s 155ms/step - accuracy: 0.8262 - loss: 0.4119
Epoch 16: val_accuracy did not improve from 0.72897
91/91 ━━━━━━━━━━━━━━━━━━━━ 20s 158ms/step - accuracy: 0.8263 - loss: 0.4116 - val_accuracy: 0.7165 - val_loss: 0.7693
Epoch 17/60
90/91 ━━━━━━━━━━━━━━━━━━━━ 0s 155ms/step - accuracy: 0.8396 - loss: 0.3647
Epoch 17: val_accuracy did not improve from 0.72897
91/91 ━━━━━━━━━━━━━━━━━━━━ 21s 161ms/step - accuracy: 0.8398 - loss: 0.3644 - val_accuracy: 0.6916 - val_loss: 0.8216
Epoch 18/60
90/91 ━━━━━━━━━━━━━━━━━━━━ 0s 155ms/step - accuracy: 0.8436 - loss: 0.3614
Epoch 18: val_accuracy improved from 0.72897 to 0.75078, saving model to best_model.keras
91/91 ━━━━━━━━━━━━━━━━━━━━ 20s 159ms/step - accuracy: 0.8440 - loss: 0.3609 - val_accuracy: 0.7508 - val_loss: 0.7519
Epoch 18: early stopping

plt.plot(history.history['accuracy'])
plt.plot(history.history['val_accuracy'])
plt.title('model accuracy')
plt.ylabel('accuracy')
plt.xlabel('epoch')
plt.legend(['train', 'validation'], loc = 'upper left')
plt.show()

model_2.evaluate(X_test, y_test_encoded)

35/35 ━━━━━━━━━━━━━━━━━━━━ 3s 98ms/step - accuracy: 0.7329 - loss: 0.7416

[0.6977789402008057, 0.7376599907875061]

from sklearn.metrics import classification_report
from sklearn.metrics import confusion_matrix

pred = model_2.predict(X_test)
pred = np.argmax(pred, axis = 1)
y_true = np.argmax(y_test_encoded, axis = 1)

#Printing the classification report
print(classification_report(y_true, pred))

#Plotting the heatmap using confusion matrix
cm = confusion_matrix(y_true, pred)
plt.figure(figsize = (8, 5))
sns.heatmap(cm, annot = True,  fmt = '.0f', xticklabels = ['Bread', 'Soup', 'Vegetable-Fruit'], yticklabels = ['Bread', 'Soup', 'Vegetable-Fruit'])
plt.ylabel('Actual')
plt.xlabel('Predicted')
plt.show()

35/35 ━━━━━━━━━━━━━━━━━━━━ 2s 40ms/step
              precision    recall  f1-score   support

           0       0.69      0.55      0.61       362
           1       0.71      0.89      0.79       500
           2       0.93      0.70      0.80       232

    accuracy                           0.74      1094
   macro avg       0.78      0.71      0.73      1094
weighted avg       0.75      0.74      0.73      1094

# Plotting the test image
cv2_imshow(X_test[1] * 255)  # Multiplying with 255, because X_test was previously normalized.
i = y_test.Label[1]
i = np.argmax(i)
if(i == 0):
    plt.title("Bread")
if(i == 1):
    plt.title("Soup")
if(i == 2):
    plt.title("Vegetable-Fruit")

plt.axis('off')
plt.show()

# Predicting the test image with the best model and storing the prediction value in res variable
res = model_2.predict(X_test[1].reshape(1, 150, 150, 3))

1/1 ━━━━━━━━━━━━━━━━━━━━ 0s 420ms/step

# Applying argmax on the prediction to get the highest index value
i=np.argmax(res)
if(i == 0):
    print("Bread")
if(i==1):
    print("Soup")
if(i==2):
    print("Vegetable-Fruit")

Bread

# Convert notebook to html
!jupyter nbconvert --to html "/content/drive/MyDrive/MIT - Data Sciences/Colab Notebooks/Week_Six_-_Deep_Learning/Guided_Project_Food_Image_Classification/Food_Image_Classification_Mine.ipynb"

Food Image Classification¶

Context:¶

Objective:¶

Dataset:¶

Mount the Drive¶

Importing the Libraries¶

Importing the Dataset¶

Preparing the Data¶

Training Data¶

Testing Data¶

Visualizing images randomly from each class¶

Bread¶

Soup¶

Vegetable-Fruit¶

Data Preprocessing¶

Checking Distribution of Classes¶

Normalizing the data¶

Encoding Target Variable¶

Model Building¶

Model 1 Architecture:¶

Training the Model¶

Plotting the Training and Validation Accuracies¶

Checking Test Accuracy¶

Plotting Confusion Matrix¶

Model 2 Architecture:¶

Training the Model¶

Plotting the Training and Validation Accuracies¶

Checking Test Accuracy¶

Plotting Confusion Matrix¶

Prediction¶

Conclusion and Recommendations¶