Classifying cats versus dogs with data generators#

Keras provides a data generator API for loading and transforming data in batches. Data generators are particularly useful for image classification. The cats and dogs image dataset comes as a folder with a predefined structure for the training and validation sets and for the different classes (all images that belong to a class are stored in the same sub-folder). The data generator API understands this structure and feeds the CNN model with the relevant images and their corresponding labels.
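Concretely, the generator expects one sub-folder per split and, inside each split, one sub-folder per class. Here is a small sketch (assuming the dataset has been extracted to ./datasets/cats_and_dogs_filtered, as in the code below, and that the images are .jpg files) that prints this layout:

import pathlib

# Assumed location of the extracted dataset
root = pathlib.Path("./datasets/cats_and_dogs_filtered")

# Print the split/class hierarchy the data generator relies on,
# e.g. train/cats, train/dogs, validation/cats, validation/dogs
for split_dir in sorted(p for p in root.iterdir() if p.is_dir()):
    for class_dir in sorted(p for p in split_dir.iterdir() if p.is_dir()):
        n_images = len(list(class_dir.glob("*.jpg")))
        print(f"{split_dir.name}/{class_dir.name}: {n_images} images")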

Importing libraries and packages#

# System
import os
import pathlib

# Silence TensorFlow's C++ log messages; the variable must be set
# before tensorflow is imported to take effect
os.environ["TF_CPP_MIN_LOG_LEVEL"] = "2"

# Mathematical operations and data manipulation
import numpy as np

# Modelling
import tensorflow as tf
from tensorflow.keras import layers
from tensorflow.keras.preprocessing.image import ImageDataGenerator

Set paths#

# Path to the cats_and_dogs_filtered directory
path = pathlib.Path(r"./datasets/cats_and_dogs_filtered")
# Paths to the train and validation directories
train_path = path / "train"
validation_path = path / "validation"

# Paths to the class sub-folders
train_cats_path = train_path / "cats"
train_dogs_path = train_path / "dogs"
validation_cats_path = validation_path / "cats"
validation_dogs_path = validation_path / "dogs"
# Count the number of images in the training and validation sets
total_train = len(os.listdir(train_cats_path)) + len(os.listdir(train_dogs_path))
total_val = len(os.listdir(validation_cats_path)) + len(os.listdir(validation_dogs_path))
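As a quick sanity check (an illustrative print, not part of the original notebook), these totals should match the counts reported by the generators further down:

# The filtered dataset ships with 2000 training images (1000 cats, 1000 dogs)
# and 1000 validation images (500 per class)
print(f"Total training images: {total_train}")
print(f"Total validation images: {total_val}")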

Data generators#

# Instantiating two ImageDataGenerator classes
data_gen_train = ImageDataGenerator(rescale=1.0 / 255)
data_gen_valid = ImageDataGenerator(rescale=1.0 / 255)

batch_size = 16
img_height = 100
img_width = 100

# Create data generators
train_generator = data_gen_train.flow_from_directory(
    train_path,
    target_size=(img_height, img_width),
    batch_size=batch_size,
    shuffle=True,
    class_mode="binary",
)

valid_generator = data_gen_valid.flow_from_directory(
    validation_path,
    target_size=(img_height, img_width),
    batch_size=batch_size,
    shuffle=True,
    class_mode="binary",
)
Found 2000 images belonging to 2 classes.
Found 1000 images belonging to 2 classes.
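To see exactly what the generators yield, a small sketch (using only the generators defined above) pulls one batch and prints its shape along with the class-to-index mapping:

# Mapping from class sub-folder name to integer label
print(train_generator.class_indices)  # e.g. {'cats': 0, 'dogs': 1}

# Each iteration yields a batch of rescaled images and their binary labels
images, labels = next(train_generator)
print(images.shape)  # (16, 100, 100, 3) with the settings above
print(labels.shape)  # (16,)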

Training of the network#

# Setting 8 as the seed for numpy and tensorflow
np.random.seed(8)
tf.random.set_seed(8)
model = tf.keras.Sequential(
    [
        layers.Conv2D(
            64, 3, activation="relu", input_shape=(img_height, img_width, 3)
        ),
        layers.MaxPooling2D(),
        layers.Conv2D(128, 3, activation="relu"),
        layers.MaxPooling2D(),
        layers.Flatten(),
        layers.Dense(128, activation="relu"),
        layers.Dense(1, activation="sigmoid"),
    ]
)
optimizer = tf.keras.optimizers.Adam(0.001)

# Providing training parameters using the compile method
model.compile(
    loss="binary_crossentropy", optimizer=optimizer, metrics=["accuracy"]
)

# Inspecting the model configuration using the summary method
model.summary()
Model: "sequential"
_________________________________________________________________
Layer (type)                 Output Shape              Param #   
=================================================================
conv2d (Conv2D)              (None, 98, 98, 64)        1792      
_________________________________________________________________
max_pooling2d (MaxPooling2D) (None, 49, 49, 64)        0         
_________________________________________________________________
conv2d_1 (Conv2D)            (None, 47, 47, 128)       73856     
_________________________________________________________________
max_pooling2d_1 (MaxPooling2 (None, 23, 23, 128)       0         
_________________________________________________________________
flatten (Flatten)            (None, 67712)             0         
_________________________________________________________________
dense (Dense)                (None, 128)               8667264   
_________________________________________________________________
dense_1 (Dense)              (None, 1)                 129       
=================================================================
Total params: 8,743,041
Trainable params: 8,743,041
Non-trainable params: 0
_________________________________________________________________
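The parameter counts in the summary can be reproduced by hand; the following sketch (derived only from the layer shapes shown above) recomputes them:

# Conv2D parameters: (kernel_h * kernel_w * input_channels + 1 bias) * filters
conv1_params = (3 * 3 * 3 + 1) * 64        # 1,792
conv2_params = (3 * 3 * 64 + 1) * 128      # 73,856

# Dense parameters: inputs * units + biases
dense1_params = 23 * 23 * 128 * 128 + 128  # 67,712 * 128 + 128 = 8,667,264
dense2_params = 128 * 1 + 1                # 129

# Total matches the 8,743,041 reported by model.summary()
print(conv1_params + conv2_params + dense1_params + dense2_params)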
# Train the model by calling the fit method
model.fit(
    train_generator,
    epochs=5,
    steps_per_epoch=total_train // batch_size,
    validation_data=valid_generator,
    validation_steps=total_val // batch_size,
)
Epoch 1/5
125/125 [==============================] - 30s 234ms/step - loss: 0.7874 - accuracy: 0.5450 - val_loss: 0.6732 - val_accuracy: 0.5716
Epoch 2/5
125/125 [==============================] - 32s 255ms/step - loss: 0.6360 - accuracy: 0.6439 - val_loss: 0.6324 - val_accuracy: 0.6421
Epoch 3/5
125/125 [==============================] - 32s 259ms/step - loss: 0.5711 - accuracy: 0.6842 - val_loss: 0.6285 - val_accuracy: 0.6593
Epoch 4/5
125/125 [==============================] - 32s 259ms/step - loss: 0.4588 - accuracy: 0.7856 - val_loss: 0.6368 - val_accuracy: 0.7016
Epoch 5/5
125/125 [==============================] - 33s 262ms/step - loss: 0.3320 - accuracy: 0.8542 - val_loss: 0.6925 - val_accuracy: 0.6774
<tensorflow.python.keras.callbacks.History at 0x7f56082ba400>

The model is overfitting quite noticeably: training accuracy climbs to about 0.85 while validation accuracy stalls around 0.68, and the validation loss starts rising again after the third epoch.
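A common remedy, not applied here, is to augment the training images through the same ImageDataGenerator API (and/or add dropout to the dense layers). A minimal sketch of an augmented training generator, with illustrative augmentation values that are not tuned for this dataset:

# Augmented training generator: random flips, rotations and zooms
data_gen_train_aug = ImageDataGenerator(
    rescale=1.0 / 255,
    horizontal_flip=True,
    rotation_range=20,
    zoom_range=0.2,
)

train_generator_aug = data_gen_train_aug.flow_from_directory(
    train_path,
    target_size=(img_height, img_width),
    batch_size=batch_size,
    shuffle=True,
    class_mode="binary",
)

The validation generator should keep only the rescaling so that evaluation is performed on unmodified images.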