Error analysis on classifications of handwritten digits#

To perform error analysis, the predict method is applied to each of the three data splits (training, validation, and testing). The following code snippets present a clean way of measuring all three metrics — accuracy, precision, and recall — on all three sets at once for the Naive Bayes, Decision Tree, and SVM models trained on the handwritten digits dataset.

Importing libraries and packages#

 1# Mathematical operations and data manipulation
 2import pandas as pd
 3
 4# Dataset
 5from sklearn.datasets import load_digits
 6
 7# Models
 8from sklearn.model_selection import train_test_split
 9from sklearn.naive_bayes import GaussianNB
10from sklearn.tree import DecisionTreeClassifier
11from sklearn.svm import SVC
12from sklearn.metrics import accuracy_score, precision_score, recall_score
13
14# Warnings
15import warnings
16
17warnings.filterwarnings("ignore")

Set paths#

# Directory that holds the input datasets
data_path = "./datasets"

# Directory where generated results are saved
assets_path = "./assets"

Loading dataset#

sklearn.datasets.load_digits - The output is a dictionary-like object that exposes the features and the target as two separate attributes, accessible as data and target respectively.

# Load the handwritten-digits dataset: a dict-like object exposing the
# pixel features (.data) and the digit labels (.target).
dataset = load_digits()

Partitioning dataset#

# Convert each attribute (data and target) into a Pandas DataFrame:
# X holds the flattened 8x8 pixel features per image, Y the digit labels.
X = pd.DataFrame(dataset.data)
Y = pd.DataFrame(dataset.target)

print("Shape of X: ", X.shape)
print("Shape of Y: ", Y.shape)
Shape of X:  (1797, 64)
Shape of Y:  (1797, 1)
1X.head()
0 1 2 3 4 5 6 7 8 9 ... 54 55 56 57 58 59 60 61 62 63
0 0.0 0.0 5.0 13.0 9.0 1.0 0.0 0.0 0.0 0.0 ... 0.0 0.0 0.0 0.0 6.0 13.0 10.0 0.0 0.0 0.0
1 0.0 0.0 0.0 12.0 13.0 5.0 0.0 0.0 0.0 0.0 ... 0.0 0.0 0.0 0.0 0.0 11.0 16.0 10.0 0.0 0.0
2 0.0 0.0 0.0 4.0 15.0 12.0 0.0 0.0 0.0 0.0 ... 5.0 0.0 0.0 0.0 0.0 3.0 11.0 16.0 9.0 0.0
3 0.0 0.0 7.0 15.0 13.0 1.0 0.0 0.0 0.0 8.0 ... 9.0 0.0 0.0 0.0 7.0 13.0 13.0 9.0 0.0 0.0
4 0.0 0.0 0.0 1.0 11.0 0.0 0.0 0.0 0.0 0.0 ... 0.0 0.0 0.0 0.0 0.0 2.0 16.0 4.0 0.0 0.0

5 rows × 64 columns

# First split of the data using the train_test_split function:
# hold out 20% of the samples as the final test set.
X_train, X_test, Y_train, Y_test = train_test_split(
    X, Y, test_size=0.2, random_state=0
)

print("Shape of X_train: ", X_train.shape)
print("Shape of X_test: ", X_test.shape)
# Fixed: previously printed Y.shape (the full target, (1797, 1)) instead
# of the training target's shape.
print("Shape of Y_train: ", Y_train.shape)
print("Shape of Y_test: ", Y_test.shape)
Shape of X_train:  (1437, 64)
Shape of X_test:  (360, 64)
Shape of Y_train:  (1797, 1)
Shape of Y_test:  (360, 1)
# Second split for a validation set (dev set): to obtain a dev set
# that's the same shape as the test set, it is necessary to calculate
# the proportion of the size of the test set over the size of the
# train set before creating a validation set.
dev_size = X_test.shape[0] / X_train.shape[0]
print(dev_size)
 1X_train, X_dev, Y_train, Y_dev = train_test_split(
 2    X_train, Y_train, test_size=dev_size
 3)
 4
 5print("Shape of X_train: ", X_train.shape)
 6print("Shape of Y_train: ", Y_train.shape)
 7print("Shape of X_dev: ", X_dev.shape)
 8print("Shape of Y_dev: ", Y_dev.shape)
 9print("Shape of X_test: ", X_test.shape)
10print("Shape of Y_test: ", Y_test.shape)
Shape of X_train:  (1077, 64)
Shape of Y_train:  (1077, 1)
Shape of X_dev:  (360, 64)
Shape of Y_dev:  (360, 1)
Shape of X_test:  (360, 64)
Shape of Y_test:  (360, 1)

Naïve Bayes algorithm#

# Gaussian Naive Bayes classifier fitted on the training split.
# NOTE(review): Y_train is an (n, 1) DataFrame; sklearn expects a 1-D y,
# which presumably triggers the warnings silenced at the top of the file.
model_NB = GaussianNB()
model_NB.fit(X_train, Y_train)
GaussianNB()
In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
On GitHub, the HTML representation is unable to render, please try loading this page with nbviewer.org.
 1pred_1 = model_NB.predict(
 2    [
 3        [
 4            0.0,
 5            0.0,
 6            5.0,
 7            13.0,
 8            9.0,
 9            1.0,
10            0.0,
11            0.0,
12            0.0,
13            0.0,
14            13.0,
15            15.0,
16            10.0,
17            15.0,
18            5.0,
19            0.0,
20            0.0,
21            3.0,
22            15.0,
23            2.0,
24            0.0,
25            11.0,
26            8.0,
27            0.0,
28            0.0,
29            4.0,
30            12.0,
31            0.0,
32            0.0,
33            8.0,
34            8.0,
35            0.0,
36            0.0,
37            5.0,
38            8.0,
39            0.0,
40            0.0,
41            9.0,
42            8.0,
43            0.0,
44            0.0,
45            4.0,
46            11.0,
47            0.0,
48            1.0,
49            12.0,
50            7.0,
51            0.0,
52            0.0,
53            2.0,
54            14.0,
55            5.0,
56            10.0,
57            12.0,
58            0.0,
59            0.0,
60            0.0,
61            0.0,
62            6.0,
63            13.0,
64            10.0,
65            0.0,
66            0.0,
67            0.0,
68        ]
69    ]
70)
71print(pred_1)
[0]

Decision tree algorithm#

# Decision tree classifier; random_state fixes the tie-breaking so the
# fitted tree is reproducible across runs.
model_tree = DecisionTreeClassifier(random_state=101)
model_tree.fit(X_train, Y_train)
DecisionTreeClassifier(random_state=101)
In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
On GitHub, the HTML representation is unable to render, please try loading this page with nbviewer.org.
 1pred_2 = model_tree.predict(
 2    [
 3        [
 4            0.0,
 5            0.0,
 6            5.0,
 7            13.0,
 8            9.0,
 9            1.0,
10            0.0,
11            0.0,
12            0.0,
13            0.0,
14            13.0,
15            15.0,
16            10.0,
17            15.0,
18            5.0,
19            0.0,
20            0.0,
21            3.0,
22            15.0,
23            2.0,
24            0.0,
25            11.0,
26            8.0,
27            0.0,
28            0.0,
29            4.0,
30            12.0,
31            0.0,
32            0.0,
33            8.0,
34            8.0,
35            0.0,
36            0.0,
37            5.0,
38            8.0,
39            0.0,
40            0.0,
41            9.0,
42            8.0,
43            0.0,
44            0.0,
45            4.0,
46            11.0,
47            0.0,
48            1.0,
49            12.0,
50            7.0,
51            0.0,
52            0.0,
53            2.0,
54            14.0,
55            5.0,
56            10.0,
57            12.0,
58            0.0,
59            0.0,
60            0.0,
61            0.0,
62            6.0,
63            13.0,
64            10.0,
65            0.0,
66            0.0,
67            0.0,
68        ]
69    ]
70)
71print(pred_2)
[0]

Support vector machine algorithm#

# Support vector classifier (RBF kernel by default); random_state only
# affects probability estimation shuffling, kept for consistency.
model_svm = SVC(random_state=101)
model_svm.fit(X_train, Y_train)
SVC(random_state=101)
In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
On GitHub, the HTML representation is unable to render, please try loading this page with nbviewer.org.
 1pred_3 = model_svm.predict(
 2    [
 3        [
 4            0.0,
 5            0.0,
 6            5.0,
 7            13.0,
 8            9.0,
 9            1.0,
10            0.0,
11            0.0,
12            0.0,
13            0.0,
14            13.0,
15            15.0,
16            10.0,
17            15.0,
18            5.0,
19            0.0,
20            0.0,
21            3.0,
22            15.0,
23            2.0,
24            0.0,
25            11.0,
26            8.0,
27            0.0,
28            0.0,
29            4.0,
30            12.0,
31            0.0,
32            0.0,
33            8.0,
34            8.0,
35            0.0,
36            0.0,
37            5.0,
38            8.0,
39            0.0,
40            0.0,
41            9.0,
42            8.0,
43            0.0,
44            0.0,
45            4.0,
46            11.0,
47            0.0,
48            1.0,
49            12.0,
50            7.0,
51            0.0,
52            0.0,
53            2.0,
54            14.0,
55            5.0,
56            10.0,
57            12.0,
58            0.0,
59            0.0,
60            0.0,
61            0.0,
62            6.0,
63            13.0,
64            10.0,
65            0.0,
66            0.0,
67            0.0,
68        ]
69    ]
70)
71print(pred_3)
[0]

Error analysis#

# Bundle the three partitions so all metrics can be computed in one loop.
X_sets = [X_train, X_dev, X_test]
Y_sets = [Y_train, Y_dev, Y_test]
# One accumulator per model; each metric list will receive one value per
# data split (train, dev, test), in that order.
metrics = {
    model: {"Acc": [], "Pre": [], "Rec": []}
    for model in ("NB", "DT", "SVM")
}

The default value for the argument ‘average’ in precision_score and recall_score is ‘binary’, but this is a multi-class classification task. ‘weighted’ calculates the metric for each label and then finds their average weighted by support (the number of true instances for each label).

 1for i in range(0, len(X_sets)):
 2    pred_NB = model_NB.predict(X_sets[i])
 3    metrics["NB"]["Acc"].append(accuracy_score(Y_sets[i], pred_NB))
 4    metrics["NB"]["Pre"].append(
 5        precision_score(Y_sets[i], pred_NB, average="weighted")
 6    )
 7    metrics["NB"]["Rec"].append(
 8        recall_score(Y_sets[i], pred_NB, average="weighted")
 9    )
10
11    pred_tree = model_tree.predict(X_sets[i])
12    metrics["DT"]["Acc"].append(accuracy_score(Y_sets[i], pred_tree))
13    metrics["DT"]["Pre"].append(
14        precision_score(Y_sets[i], pred_tree, average="weighted")
15    )
16    metrics["DT"]["Rec"].append(
17        recall_score(Y_sets[i], pred_tree, average="weighted")
18    )
19
20    pred_svm = model_svm.predict(X_sets[i])
21    metrics["SVM"]["Acc"].append(accuracy_score(Y_sets[i], pred_svm))
22    metrics["SVM"]["Pre"].append(
23        precision_score(Y_sets[i], pred_svm, average="weighted")
24    )
25    metrics["SVM"]["Rec"].append(
26        recall_score(Y_sets[i], pred_svm, average="weighted")
27    )
1print(metrics)
{'NB': {'Acc': [0.8774373259052924, 0.8527777777777777, 0.8416666666666667], 'Pre': [0.894594794327501, 0.8707830700894467, 0.8718887380991854], 'Rec': [0.8774373259052924, 0.8527777777777777, 0.8416666666666667]}, 'DT': {'Acc': [1.0, 0.8638888888888889, 0.8861111111111111], 'Pre': [1.0, 0.8693356298220537, 0.8890506509622977], 'Rec': [1.0, 0.8638888888888889, 0.8861111111111111]}, 'SVM': {'Acc': [0.9962859795728877, 0.9805555555555555, 0.9888888888888889], 'Pre': [0.996302725482844, 0.9809229390681004, 0.9888966049382717], 'Rec': [0.9962859795728877, 0.9805555555555555, 0.9888888888888889]}}