# Thimira/lenet_mnist_keras.py

## lenet_mnist_keras.py
# How to use
#
# Train the model and save the model weights
# python lenet_mnist_keras.py --train-model 1 --save-trained 1
#
# Train the model and save the model weights to a given file path
# python lenet_mnist_keras.py --train-model 1 --save-trained 1 --weights data/lenet_weights.hdf5
#
# Evaluate the model using pre-trained model weights
# python lenet_mnist_keras.py
#
# Evaluate the model using pre-trained model weights from a given file path
# python lenet_mnist_keras.py --weights data/lenet_weights.hdf5

# import the necessary packages
from keras.datasets import mnist
from keras.optimizers import SGD
from keras.utils import np_utils

# imports used to build the deep learning model
from keras.models import Sequential
from keras.layers.convolutional import Conv2D
from keras.layers.convolutional import MaxPooling2D
from keras.layers.core import Activation
from keras.layers.core import Flatten
from keras.layers.core import Dense

import numpy as np
import argparse
import cv2
import matplotlib.pyplot as plt

# Set up the command line interface.
# --train-model and --save-trained are integer switches: the rest of the
# script treats any value greater than zero as "on", and the default of -1
# leaves the option off.
ap = argparse.ArgumentParser()
ap.add_argument("-t", "--train-model", type=int, default=-1,
                help="(optional) Whether the model should be trained on the MNIST dataset. Defaults to no")
# The two help fragments are adjacent string literals; the trailing space on
# the first one keeps "saved." and "Overwrites" from running together.
ap.add_argument("-s", "--save-trained", type=int, default=-1,
                help="(optional) Whether the trained models weights should be saved. "
                     "Overwrites existing weights file with the same name. Use with caution. Defaults to no")
ap.add_argument("-w", "--weights", type=str, default="data/lenet_weights.hdf5",
                help="(optional) Path to the weights file. Defaults to 'data/lenet_weights.hdf5'")
# vars() turns the parsed Namespace into a plain dict keyed by option name
# (dashes become underscores, e.g. args["train_model"]).
args = vars(ap.parse_args())


def build_lenet(width, height, depth, classes, weightsPath=None):
    """Assemble the LeNet network as a Keras Sequential model.

    Layer order: (CONV => RELU => POOL) twice, then FC => RELU, then a
    softmax classifier.

    width, height, depth -- dimensions of one input image; the first
        convolution is given input_shape=(height, width, depth).
    classes -- number of units in the final Dense (softmax) layer.
    weightsPath -- optional path to a weights file; when it is not None the
        weights are loaded into the model once all layers have been added.

    Returns the assembled model. It is not compiled here.
    """
    network = Sequential()

    # The layers, listed in the order they are stacked
    layer_stack = [
        # First CONV => RELU => POOL group
        Conv2D(20, (5, 5), padding="same",
               input_shape=(height, width, depth)),
        Activation("relu"),
        MaxPooling2D(pool_size=(2, 2), strides=(2, 2)),

        # Second CONV => RELU => POOL group
        Conv2D(50, (5, 5), padding="same"),
        Activation("relu"),
        MaxPooling2D(pool_size=(2, 2), strides=(2, 2)),

        # FC => RELU
        Flatten(),
        Dense(500),
        Activation("relu"),

        # Softmax classifier
        Dense(classes),
        Activation("softmax"),
    ]
    for layer in layer_stack:
        network.add(layer)

    # Load stored weights only when the caller supplied a path
    if weightsPath is None:
        return network

    network.load_weights(weightsPath)
    return network


def graph_training_history(history):
    """Plot the accuracy and loss curves recorded during training.

    history -- the object returned by model.fit(); its `history` attribute
        is read as a dict mapping metric names to per-epoch values. The
        matching 'val_*' entries must be present as well.

    Draws two stacked subplots on figure 1 (accuracy on top, loss below) and
    then calls plt.show().

    Raises KeyError if a required entry is missing from the history dict.
    """
    records = history.history

    # Keras stores the "accuracy" metric under 'acc'/'val_acc' in older
    # releases and under 'accuracy'/'val_accuracy' in newer ones. Accept
    # either spelling so a finished training run is not lost to a KeyError.
    acc_key = 'acc' if 'acc' in records else 'accuracy'

    # (subplot position, history key, title, y-axis label)
    panels = (
        (211, acc_key, 'model accuracy', 'accuracy'),
        (212, 'loss', 'model loss', 'loss'),
    )

    plt.figure(1)
    for position, key, title, ylabel in panels:
        plt.subplot(position)
        plt.plot(records[key])
        plt.plot(records['val_' + key])
        plt.title(title)
        plt.ylabel(ylabel)
        plt.xlabel('epoch')
        plt.legend(['train', 'test'], loc='upper left')

    plt.show()


# Fetch MNIST through the Keras datasets helper.
# On first use the dataset (~10MB) is downloaded and placed at
# ~/.keras/datasets/mnist.npz
print("[INFO] Loading the MNIST dataset...")
(trainData, trainLabels), (testData, testLabels) = mnist.load_data()
# load_data() hands back numpy arrays that are already split into
# training and testing sets

# Append a channel axis so (samples, height, width) becomes
# (samples, height, width, depth); MNIST is grayscale, so depth is 1.
# Dividing by 255.0 then rescales the pixel values from [0 - 255] to [0 - 1.0].
trainData = np.expand_dims(trainData, axis=-1) / 255.0
testData = np.expand_dims(testData, axis=-1) / 255.0

# Each label arrives as a single digit naming the class. The network needs a
# categorical (one-hot) vector of length 10 instead, e.g.
# '0' -> [1, 0, 0, 0, 0, 0, 0, 0, 0, 0]
# '1' -> [0, 1, 0, 0, 0, 0, 0, 0, 0, 0]
# '2' -> [0, 0, 1, 0, 0, 0, 0, 0, 0, 0]
trainLabels, testLabels = (
    np_utils.to_categorical(labels, 10)
    for labels in (trainLabels, testLabels)
)

# Construct LeNet for 28x28 single-channel inputs and 10 classes, then compile it.
# Stored weights are loaded only when no training was requested; a model
# that is about to be trained is built without them.
print("[INFO] Building and compiling the LeNet model...")
opt = SGD(lr=0.01)
model = build_lenet(
    width=28, height=28, depth=1, classes=10,
    weightsPath=None if args["train_model"] > 0 else args["weights"])
model.compile(optimizer=opt,
              loss="categorical_crossentropy",
              metrics=["accuracy"])

# Train only when --train-model was given a positive value
if args["train_model"] > 0:
    print("[INFO] Training the model...")

    # The test split is passed as validation data for every epoch
    history = model.fit(
        trainData, trainLabels,
        validation_data=(testData, testLabels),
        batch_size=128, epochs=20, verbose=1)

    # Score the trained model on the test split
    print("[INFO] Evaluating the model...")
    loss, accuracy = model.evaluate(testData, testLabels,
                                    batch_size=128, verbose=1)
    print("[INFO] accuracy: {:.2f}%".format(accuracy * 100))

    # Plot the per-epoch accuracy and loss
    graph_training_history(history)

# Write the weights to disk only when --save-trained was given a positive value.
# An existing file at the same path is overwritten.
if args["save_trained"] > 0:
    print("[INFO] Saving the model weights to file...")
    model.save_weights(args["weights"], overwrite=True)

# Training of the model is now complete

# Spot-check the model on 10 randomly drawn test samples
for idx in np.random.choice(np.arange(len(testLabels)), size=10):
    # Classify the digit; the sample is wrapped in a batch of one
    probs = model.predict(np.expand_dims(testData[idx], axis=0))
    predicted_digit = np.argmax(probs, axis=1)[0]
    actual_digit = np.argmax(testLabels[idx])

    # Scale the pixels back up to 8-bit values and convert to a color image
    # so the prediction can be drawn on it in green
    image = cv2.cvtColor((testData[idx] * 255).astype("uint8"),
                         cv2.COLOR_GRAY2RGB)

    # 28x28 is much too small to see properly, so enlarge to 280x280
    image = cv2.resize(image, (280, 280), interpolation=cv2.INTER_LINEAR)

    # Stamp the predicted value onto the image
    cv2.putText(image, str(predicted_digit), (20, 40),
                cv2.FONT_HERSHEY_DUPLEX, 1.5, (0, 255, 0), 1)

    # Report the result and show the image until a key is pressed
    print("[INFO] Predicted: {}, Actual: {}".format(
        predicted_digit, actual_digit))
    cv2.imshow("Digit", image)
    cv2.waitKey(0)

cv2.destroyAllWindows()
	# How to use
	#
	# Train the model and save the model weights
	# python lenet_mnist_keras.py --train-model 1 --save-trained 1
	#
	# Train the model and save the model weights to a given file path
	# python lenet_mnist_keras.py --train-model 1 --save-trained 1 --weights data/lenet_weights.hdf5
	#
	# Evaluate the model using pre-trained model weights
	# python lenet_mnist_keras.py
	#
	# Evaluate the model using pre-trained model weights from a given file path
	# python lenet_mnist_keras.py --weights data/lenet_weights.hdf5

	# import the necessary packages
	from keras.datasets import mnist
	from keras.optimizers import SGD
	from keras.utils import np_utils

	# imports used to build the deep learning model
	from keras.models import Sequential
	from keras.layers.convolutional import Conv2D
	from keras.layers.convolutional import MaxPooling2D
	from keras.layers.core import Activation
	from keras.layers.core import Flatten
	from keras.layers.core import Dense

	import numpy as np
	import argparse
	import cv2
	import matplotlib.pyplot as plt

	# Set up the command line interface.
	# --train-model and --save-trained are integer switches: the rest of the
	# script treats any value greater than zero as "on", and the default of -1
	# leaves the option off.
	ap = argparse.ArgumentParser()
	ap.add_argument("-t", "--train-model", type=int, default=-1,
		help="(optional) Whether the model should be trained on the MNIST dataset. Defaults to no")
	# The two help fragments are adjacent string literals; the trailing space on
	# the first one keeps "saved." and "Overwrites" from running together.
	ap.add_argument("-s", "--save-trained", type=int, default=-1,
		help="(optional) Whether the trained models weights should be saved. "
		"Overwrites existing weights file with the same name. Use with caution. Defaults to no")
	ap.add_argument("-w", "--weights", type=str, default="data/lenet_weights.hdf5",
		help="(optional) Path to the weights file. Defaults to 'data/lenet_weights.hdf5'")
	# vars() turns the parsed Namespace into a plain dict keyed by option name
	# (dashes become underscores, e.g. args["train_model"]).
	args = vars(ap.parse_args())


	def build_lenet(width, height, depth, classes, weightsPath=None):
		"""Assemble the LeNet network as a Keras Sequential model.

		Layer order: (CONV => RELU => POOL) twice, then FC => RELU, then a
		softmax classifier.

		width, height, depth -- dimensions of one input image; the first
			convolution is given input_shape=(height, width, depth).
		classes -- number of units in the final Dense (softmax) layer.
		weightsPath -- optional path to a weights file; when it is not None the
			weights are loaded into the model once all layers have been added.

		Returns the assembled model. It is not compiled here.
		"""
		# Initialize the model
		model = Sequential()

		# The first set of CONV => RELU => POOL layers
		model.add(Conv2D(20, (5, 5), padding="same",
			input_shape=(height, width, depth)))
		model.add(Activation("relu"))
		model.add(MaxPooling2D(pool_size=(2, 2), strides=(2, 2)))

		# The second set of CONV => RELU => POOL layers
		model.add(Conv2D(50, (5, 5), padding="same"))
		model.add(Activation("relu"))
		model.add(MaxPooling2D(pool_size=(2, 2), strides=(2, 2)))

		# The set of FC => RELU layers
		model.add(Flatten())
		model.add(Dense(500))
		model.add(Activation("relu"))

		# The softmax classifier
		model.add(Dense(classes))
		model.add(Activation("softmax"))

		# If a weights path is supplied, then load the weights
		if weightsPath is not None:
			model.load_weights(weightsPath)

		# Return the constructed network architecture
		return model


	def graph_training_history(history):
		"""Plot the accuracy and loss curves recorded during training.

		history -- the object returned by model.fit(); its `history` attribute
			is read as a dict mapping metric names to per-epoch values. The
			matching 'val_*' entries must be present as well.

		Draws two stacked subplots on figure 1 (accuracy on top, loss below) and
		then calls plt.show().

		Raises KeyError if a required entry is missing from the history dict.
		"""
		records = history.history

		# Keras stores the "accuracy" metric under 'acc'/'val_acc' in older
		# releases and under 'accuracy'/'val_accuracy' in newer ones. Accept
		# either spelling so a finished training run is not lost to a KeyError.
		acc_key = 'acc' if 'acc' in records else 'accuracy'

		# (subplot position, history key, title, y-axis label)
		panels = (
			(211, acc_key, 'model accuracy', 'accuracy'),
			(212, 'loss', 'model loss', 'loss'),
		)

		plt.figure(1)
		for position, key, title, ylabel in panels:
			plt.subplot(position)
			plt.plot(records[key])
			plt.plot(records['val_' + key])
			plt.title(title)
			plt.ylabel(ylabel)
			plt.xlabel('epoch')
			plt.legend(['train', 'test'], loc='upper left')

		plt.show()


	# Fetch MNIST through the Keras datasets helper.
	# On first use the dataset (~10MB) is downloaded and placed at
	# ~/.keras/datasets/mnist.npz
	print("[INFO] Loading the MNIST dataset...")
	(trainData, trainLabels), (testData, testLabels) = mnist.load_data()
	# load_data() hands back numpy arrays that are already split into
	# training and testing sets

	# Append a channel axis so (samples, height, width) becomes
	# (samples, height, width, depth); MNIST is grayscale, so depth is 1.
	# Dividing by 255.0 then rescales the pixel values from [0 - 255] to [0 - 1.0].
	trainData = np.expand_dims(trainData, axis=-1) / 255.0
	testData = np.expand_dims(testData, axis=-1) / 255.0

	# Each label arrives as a single digit naming the class. The network needs a
	# categorical (one-hot) vector of length 10 instead, e.g.
	# '0' -> [1, 0, 0, 0, 0, 0, 0, 0, 0, 0]
	# '1' -> [0, 1, 0, 0, 0, 0, 0, 0, 0, 0]
	# '2' -> [0, 0, 1, 0, 0, 0, 0, 0, 0, 0]
	trainLabels, testLabels = (
		np_utils.to_categorical(labels, 10)
		for labels in (trainLabels, testLabels)
	)

	# Construct LeNet for 28x28 single-channel inputs and 10 classes, then compile it.
	# Stored weights are loaded only when no training was requested; a model
	# that is about to be trained is built without them.
	print("[INFO] Building and compiling the LeNet model...")
	opt = SGD(lr=0.01)
	model = build_lenet(width=28, height=28, depth=1, classes=10,
		weightsPath=args["weights"] if args["train_model"] <= 0 else None)
	model.compile(loss="categorical_crossentropy",
		optimizer=opt, metrics=["accuracy"])

	# Train only when --train-model was given a positive value
	if args["train_model"] > 0:
		print("[INFO] Training the model...")

		# The test split is passed as validation data for every epoch
		history = model.fit(trainData, trainLabels,
			batch_size=128,
			epochs=20,
			validation_data=(testData, testLabels),
			verbose=1)

		# Use the test data to evaluate the model
		print("[INFO] Evaluating the model...")

		(loss, accuracy) = model.evaluate(
			testData, testLabels, batch_size=128, verbose=1)

		print("[INFO] accuracy: {:.2f}%".format(accuracy * 100))

		# Visualize the training history
		graph_training_history(history)

	# Write the weights to disk only when --save-trained was given a positive value.
	# An existing file at the same path is overwritten.
	if args["save_trained"] > 0:
		print("[INFO] Saving the model weights to file...")
		model.save_weights(args["weights"], overwrite=True)

	# Training of the model is now complete

	# Randomly select a few samples from the test dataset to evaluate
	for i in np.random.choice(np.arange(0, len(testLabels)), size=(10,)):
		# Use the model to classify the digit; the sample is passed as a batch of one
		probs = model.predict(testData[np.newaxis, i])
		prediction = probs.argmax(axis=1)

		# Scale the pixels back up to 8-bit values and convert to a color image
		# so the prediction can be drawn on it in green
		image = (testData[i] * 255).astype("uint8")
		image = cv2.cvtColor(image, cv2.COLOR_GRAY2RGB)

		# The images are in 28x28 size. Much too small to see properly
		# So, we resize them to 280x280 for viewing
		image = cv2.resize(image, (280, 280), interpolation=cv2.INTER_LINEAR)

		# Add the predicted value on to the image
		cv2.putText(image, str(prediction[0]), (20, 40),
			cv2.FONT_HERSHEY_DUPLEX, 1.5, (0, 255, 0), 1)

		# Report the result and show the image until a key is pressed
		print("[INFO] Predicted: {}, Actual: {}".format(
			prediction[0], np.argmax(testLabels[i])))
		cv2.imshow("Digit", image)
		cv2.waitKey(0)

	cv2.destroyAllWindows()