Workshop: Machine Learning - Part 2 - Image Classification

16 May 2021, Carlos Pena

This post is a conversion from an old workshop of mine. For a better view, please check the notebook.

from matplotlib import pyplot as plt
from glob import glob
import numpy as np
import cv2
import pickle

from sklearn.metrics import pairwise_distances
from sklearn.preprocessing import OneHotEncoder
from sklearn.preprocessing import MinMaxScaler
from sklearn.neighbors import KNeighborsClassifier
from sklearn.svm import LinearSVC
from sklearn.metrics import accuracy_score, f1_score
from sklearn.ensemble import RandomForestClassifier
from skimage.feature import hog

import keras
from keras import datasets
from keras import layers
from keras.models import Sequential,Input,Model
from keras.layers import Dense, Dropout, Flatten
from keras.layers import Conv2D, MaxPooling2D
from keras.layers.normalization import BatchNormalization
from keras.layers.advanced_activations import LeakyReLU

# Shared preprocessing objects, created once for the whole post.
# `onehot` is fitted further down on the integer class labels.
onehot = OneHotEncoder()
# NOTE(review): `minMax` is not used anywhere in the visible part of this
# post; pixel scaling below is done by dividing by 255 instead.
minMax = MinMaxScaler()

def print_metrics(y_test, y_pred, label=''):
    """Print accuracy and macro-averaged F1 for a set of predictions.

    Parameters
    ----------
    y_test : array-like
        Ground-truth class labels. Either 1-D, or a 2-D single column / single
        row (e.g. shape ``(n, 1)``), which is flattened before scoring.
    y_pred : array-like
        Predicted class labels, one per sample.
    label : str, optional
        Name printed in front of the scores.
    """
    # Accept plain Python sequences too; the shape checks need an ndarray.
    y_test = np.asarray(y_test)

    if y_test.ndim == 2:
        if 1 in y_test.shape:
            # (n, 1) column or (1, n) row -> flat vector of n labels.
            y_test = y_test.ravel()
        else:
            # Keep going as before, but say what is wrong instead of "?".
            print(f"print_metrics: unexpected y_test shape {y_test.shape}; "
                  "expected 1-D labels or a single row/column")

    acc = accuracy_score(y_test, y_pred)
    # average='macro': compute F1 for each label, then take the unweighted mean.
    f1 = f1_score(y_test, y_pred, average='macro')

    print(f"{label}: Accuracy {acc:0.3f}\t F1 {f1:0.3f}")

Image Classification

Source: https://www.kdnuggets.com/2018/09/object-detection-image-classification-yolo.html

ImageNet

The ImageNet Large Scale Visual Recognition Challenge (ILSVRC) Source: Deng, Jia, et al. “Imagenet: A large-scale hierarchical image database.” 2009 IEEE conference on computer vision and pattern recognition. Ieee, 2009.

CIFAR-10

The CIFAR-10 dataset consists of 60000 32x32 colour images in 10 classes, with 6000 images per class. There are 50000 training images and 10000 test images.

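In the original download, each batch file contains:

data: a 10000x3072 numpy array of uint8s (one flattened 32x32x3 image per row).
labels: a list of 10000 numbers in the range 0-9.

The Keras loader used below returns the images already reshaped to 32x32x3.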

# Class index -> human-readable class name, listed in label order (0..9).
label2str = dict(enumerate((
    "airplane", "automobile", "bird", "cat", "deer",
    "dog", "frog", "horse", "ship", "truck",
)))

# Load the CIFAR-10 train/test split through Keras. As the shapes printed
# later in this post show, the test images come back as (10000, 32, 32, 3)
# and the test labels as a (10000, 1) column of class indices.
(x_train, y_train), (x_test, y_test) = datasets.cifar10.load_data()

# Show two train/test pairs in a 2x2 grid: sample 3 on the top row and
# sample 100 on the bottom row, train image on the left, test on the right.
plt.figure(figsize=(8, 8))

position = 1
for idx in (3, 100):
    train_label = y_train[idx][0]
    test_label = y_test[idx][0]
    panels = (
        ("Train", x_train[idx], train_label),
        ("Test", x_test[idx], test_label),
    )
    for split, image, class_id in panels:
        plt.subplot(2, 2, position)
        plt.axis('off')
        # The title names the split the image is actually taken from
        # (the original titles for two of the panels were swapped).
        plt.title(f'{split} - {label2str[class_id]} ({class_id})')
        plt.imshow(image)
        position += 1

png

# One-hot encode the class labels: learn the categories from the training
# labels, then apply the same encoding to both splits (dense arrays).
onehot.fit(y_train)
y_train_hot = onehot.transform(y_train).toarray()
y_test_hot = onehot.transform(y_test).toarray()

# Rescale pixel intensities by 1/255.
x_train_norm, x_test_norm = x_train / 255, x_test / 255

# Flatten every image into a single feature row for the non-convolutional models.
x_train_row = x_train_norm.reshape(x_train_norm.shape[0], -1)
x_test_row = x_test_norm.reshape(x_test_norm.shape[0], -1)

Random Choice

%%time
y_test_random = np.random.randint(0, 10, size=len(x_test))

    CPU times: user 443 µs, sys: 0 ns, total: 443 µs
    Wall time: 291 µs

print_metrics(y_test, y_test_random, 'Random')

    Random: Accuracy 0.097   F1 0.096

Closest Element

knn = KNeighborsClassifier(n_neighbors=1, n_jobs=6)

%%time
knn = knn.fit(x_train_row, y_train[:, 0])
    CPU times: user 12.3 s, sys: 61.4 ms, total: 12.4 s
    Wall time: 12.5 s

%%time
y_test_pred_knn = knn.predict(x_test_row)
    CPU times: user 42min 20s, sys: 2.04 s, total: 42min 23s
    Wall time: 7min 26s

y_test_pred_knn.shape, y_test.shape
((10000,), (10000, 1))

print_metrics(y_test, y_test_pred_knn, 'KNN')
    KNN: Accuracy 0.354  F1 0.349

Feature Extraction

HOG (Histogram of Oriented Gradients)

# Take the first colour channel of test image 297 and show it next to the
# histogram of its pixel intensities.
img = x_test[297, ..., 0]
plt.figure(figsize=(8, 4))

plt.subplot(1, 2, 1)
plt.title("Original Image")
plt.imshow(img, cmap='gray')
plt.axis('off')

plt.subplot(1, 2, 2)
plt.title("Histogram")
plt.hist(img.ravel(), bins=range(0, 256));

png

# First colour channel of test image 297.
img = x_test[297, ..., 0]

# First-order Sobel derivatives along x and along y, as 32-bit floats.
gx = cv2.Sobel(img, cv2.CV_32F, 1, 0, ksize=1)
gy = cv2.Sobel(img, cv2.CV_32F, 0, 1, ksize=1)

# Convert the (gx, gy) gradient field to magnitude and direction in degrees.
mag, angle = cv2.cartToPolar(gx, gy, angleInDegrees=True)

# One row of panels; the grid has six slots, of which five are used.
plt.figure(figsize=(24, 8))
panels = [
    (img, "Original Image"),
    (gx, "GX"),
    (gy, "GY"),
    (mag, "Magnitude"),
    (angle, "Angle"),
]
for slot, (panel, caption) in enumerate(panels, start=1):
    plt.subplot(1, 6, slot)
    plt.axis('off')
    plt.imshow(panel)
    plt.title(caption)

Source: https://learnopencv.com/histogram-of-oriented-gradients/

# Compute one HOG descriptor per image with skimage's default parameters and
# stack the descriptors into a 2-D feature matrix (one row per image).
# NOTE(review): the inputs are 3-channel images; newer scikit-image releases
# may need `channel_axis=-1` here -- confirm against the installed version.
x_train_hog = np.array([hog(src) for src in x_train])
x_test_hog = np.array([hog(src) for src in x_test])

x_test.shape, x_test_hog.shape
    ((10000, 32, 32, 3), (10000, 324))

%%time
# Fit a separate 1-NN classifier on the HOG descriptors. Calling `knn.fit`
# again would refit the pixel-space classifier in place and leave `knn` and
# `knn_hog` pointing at the same object.
knn_hog = KNeighborsClassifier(n_neighbors=1, n_jobs=6).fit(x_train_hog, y_train[:, 0])
    CPU times: user 1.48 s, sys: 7.87 ms, total: 1.49 s
    Wall time: 1.49 s

%%time
y_test_pred_knn_hog = knn_hog.predict(x_test_hog)

    CPU times: user 6min 14s, sys: 455 ms, total: 6min 15s
    Wall time: 1min 5s

y_test_pred_knn_hog.shape, y_test.shape
    ((10000,), (10000, 1))

print_metrics(y_test, y_test_pred_knn_hog, 'KNN HOG')
    KNN HOG: Accuracy 0.512  F1 0.506

Forest

forest = RandomForestClassifier(n_jobs=6)

%%time
forest = forest.fit(x_train_row, y_train[:, 0])

    CPU times: user 3min 18s, sys: 796 ms, total: 3min 19s
    Wall time: 35.5 s

%%time
y_test_pred_forest = forest.predict(x_test_row)

    CPU times: user 686 ms, sys: 82.4 ms, total: 768 ms
    Wall time: 308 ms

print_metrics(y_test, y_test_pred_forest, 'Forest')
    Forest: Accuracy 0.468   F1 0.464

Forest + HOG

forest_hog = RandomForestClassifier(n_jobs=6)

%%time
forest_hog = forest_hog.fit(x_train_hog, y_train[:, 0])
    CPU times: user 1min 23s, sys: 104 ms, total: 1min 23s
    Wall time: 14.8 s

%%time
y_test_pred_forest_hog = forest_hog.predict(x_test_hog)
    CPU times: user 275 ms, sys: 15.7 ms, total: 291 ms
    Wall time: 106 ms

print_metrics(y_test, y_test_pred_forest_hog, 'Forest HOG')
    Forest HOG: Accuracy 0.526   F1 0.522

Row

# Fully connected network on flattened pixels: three ReLU hidden layers
# followed by a 10-way softmax over the classes.
model_row = keras.Sequential()
model_row.add(layers.Dense(units=512, activation='relu'))
model_row.add(layers.Dense(units=120, activation='relu'))
model_row.add(layers.Dense(units=84, activation='relu'))
model_row.add(layers.Dense(units=10, activation='softmax'))
# The targets are one-hot vectors over 10 mutually exclusive classes and the
# output is a softmax, so the matching loss is categorical cross-entropy
# (binary cross-entropy would score each output unit as an independent
# yes/no problem).
model_row.compile(loss='categorical_crossentropy', optimizer='adam', metrics=['accuracy'])

# Flatten each image into one feature row.
train_row = x_train_norm.reshape(len(x_train_norm), -1)
test_row = x_test_norm.reshape(len(x_test_norm), -1)
# The test split is used as validation data, so the val_* curves track
# performance on images the network is not trained on.
model_row.fit(train_row, y_train_hot, epochs=100, batch_size=256,
              validation_data=(test_row, y_test_hot))

    Epoch 1/100
    196/196 [=====] - 2s 9ms/step - loss: 0.3391 - accuracy: 0.2142 - val_loss: 0.2769 - val_accuracy: 0.3559
    Epoch 2/100
    196/196 [=====] - 2s 8ms/step - loss: 0.2727 - accuracy: 0.3656 - val_loss: 0.2684 - val_accuracy: 0.3567
    ...
    Epoch 99/100
    196/196 [=====] - 2s 10ms/step - loss: 0.0940 - accuracy: 0.8188 - val_loss: 0.3307 - val_accuracy: 0.5135
    Epoch 100/100
    196/196 [=====] - 2s 10ms/step - loss: 0.0896 - accuracy: 0.8264 - val_loss: 0.3270 - val_accuracy: 0.5166

# Training curves of the dense model: loss on the left, accuracy on the
# right, each with the train and validation series.
history_row = model_row.history.history
plt.figure(figsize=(8, 4))
curves = (("loss", "Loss"), ("accuracy", "accuracy"))
for position, (metric, caption) in enumerate(curves, start=1):
    plt.subplot(1, 2, position)
    plt.plot(history_row[metric], label=f"Train {caption}")
    plt.plot(history_row[f"val_{metric}"], label=f"Val {caption}")
    plt.xlabel("Epoch")
    plt.legend()

png

As Image

# Small CNN on the 32x32x3 images: two (3x3 convolution + average pooling)
# stages, then two ReLU dense layers and a 10-way softmax.
model = keras.Sequential()
model.add(layers.Conv2D(filters=6, kernel_size=(3, 3), activation='relu', input_shape=(32, 32, 3)))
model.add(layers.AveragePooling2D())
model.add(layers.Conv2D(filters=16, kernel_size=(3, 3), activation='relu'))
model.add(layers.AveragePooling2D())
model.add(layers.Flatten())
model.add(layers.Dense(units=120, activation='relu'))
model.add(layers.Dense(units=84, activation='relu'))
model.add(layers.Dense(units=10, activation='softmax'))
# One-hot targets with a softmax output call for categorical cross-entropy,
# not binary cross-entropy.
model.compile(loss='categorical_crossentropy', optimizer='adam', metrics=['accuracy'])

# Validate on the test split, as the dense model does. Passing the training
# data as validation_data makes val_loss / val_accuracy just a second reading
# of the training metrics and hides over-fitting.
model.fit(x_train_norm, y_train_hot, epochs=200, batch_size=256,
          validation_data=(x_test_norm, y_test_hot))


    Epoch 1/200
    196/196 [==============================] - 6s 28ms/step - loss: 0.3777 - accuracy: 0.1622 - val_loss: 0.2633 - val_accuracy: 0.3735
    Epoch 2/200
    196/196 [==============================] - 5s 24ms/step - loss: 0.2585 - accuracy: 0.3877 - val_loss: 0.2447 - val_accuracy: 0.4250
    ...
    196/196 [==============================] - 5s 24ms/step - loss: 0.0563 - accuracy: 0.9122 - val_loss: 0.0547 - val_accuracy: 0.9165
    Epoch 200/200
    196/196 [==============================] - 4s 23ms/step - loss: 0.0580 - accuracy: 0.9077 - val_loss: 0.0559 - val_accuracy: 0.9137

# Training curves of the CNN: loss on the left, accuracy on the right,
# each with the train and validation series.
history_cnn = model.history.history
plt.figure(figsize=(8, 4))
curves = (("loss", "Loss"), ("accuracy", "accuracy"))
for position, (metric, caption) in enumerate(curves, start=1):
    plt.subplot(1, 2, position)
    plt.plot(history_cnn[metric], label=f"Train {caption}")
    plt.plot(history_cnn[f"val_{metric}"], label=f"Val {caption}")
    plt.xlabel("Epoch")
    plt.legend()

png

Similarity

# Tag "<test index> <class name>" for every test image, used as tick/title text.
sample_labels = [f"{idx} "+label2str[lab] for idx, lab in  enumerate(y_test[:,0])]
# Auxiliary model sharing the trained CNN's inputs that returns the output of
# every layer instead of only the final prediction.
extractor     = keras.Model(inputs=model.inputs,
                            outputs=[layer.output for layer in model.layers])
# Run the whole normalised test set through the network in one call.
features      = extractor(x_test_norm)
# Pairwise distances (scikit-learn's default metric) between the activations
# of the second-to-last layer, i.e. the Dense(84) layer of the CNN above.
distances     = pairwise_distances(features[-2])

# Heat-map of the distances between the first `view_sample` test images,
# with the images' tags on both axes.
view_sample = 10
view_labels = sample_labels[:view_sample]
dist_norm = distances[:view_sample, :view_sample]

plt.figure(figsize=(12, 12))
plt.imshow(dist_norm)
plt.colorbar()
tick_positions = range(view_sample)
plt.xticks(tick_positions, view_labels)
plt.yticks(tick_positions, view_labels)
plt.title("Distance")

png

# For a few query images, show the closest and the farthest test images in
# feature space. Top row: the 6 smallest distances (the first one is the
# query itself, since it is part of the test set). Bottom row: the 6 largest.

# Hoisted out of the loop: neither value depends on the query image.
labels_arr = np.array(sample_labels)
len_data = len(x_test)
n_show = 6

for id_sample in [1, 6159, 100, 200, 1000, 3268]:
    # Test-set indices ordered from nearest to farthest from the query.
    dist_argsort = distances[id_sample].argsort()
    similar = labels_arr[dist_argsort]
    dist_sorted = distances[id_sample][dist_argsort]

    plt.figure(figsize=(20, 7))
    for row, caption in enumerate(("Similar", "Dissimilar")):
        for id_col in range(n_show):
            # Row 0 walks the ranking from the front, row 1 from the back.
            rank = id_col if row == 0 else len_data - id_col - 1
            plt.subplot(2, n_show, row * n_show + id_col + 1)
            plt.title(f"{caption} - {similar[rank]}\n{dist_sorted[rank]:0.2f}")
            plt.imshow(x_test[dist_argsort[rank]])
            plt.axis('off')