Implementation of a simple neural network with the backpropagation algorithm.
import numpy as np

# Activation function and its derivative (sigmoid)
def sigmoid(x):
    return 1 / (1 + np.exp(-x))

def sigmoid_derivative(a):
    # Derivative of the sigmoid written in terms of its output a = sigmoid(z)
    return a * (1 - a)
# Error function (Mean Squared Error) and its derivative
def MSE(yBar, y):
    return 0.5 * np.sum((yBar - y)**2)

def MSE_derivative(yBar, y):
    return y - yBar

# Class for a neural network
class NeuralNetwork:
    def __init__(self, L=[2, 1]):
        # L is a list of the number of neurons in each layer
        self.L = L
        # W is a list of the weight matrices
        self.W = np.array([np.random.rand(L[i+1], L[i]+1) for i in range(len(L)-1)],
                          dtype=object)

    def forward(self, x):
        """ Forward propagation """
        # List of perceptron outputs after applying the activation function
        a = np.array([np.zeros((self.L[i], x.shape[1])) for i in range(len(self.L))],
                     dtype=object)
        # Input layer
        a[0] = x

        for l in range(1, len(a)):
            # Weighted sum of inputs (including bias row)
            z = self.W[l-1] @ np.vstack((np.ones((1, x.shape[1])), a[l-1]))
            # Apply activation function
            a[l] = sigmoid(z)

        return a

    def backward(self, yBar, a):
        """ Backward propagation """
        # Derivative for the last layer
        delta = MSE_derivative(yBar, a[-1]) * sigmoid_derivative(a[-1])
        grad = np.zeros_like(self.W)

        for l in range(len(self.W)-1, -1, -1):
            # Gradient for the current layer
            grad[l] = delta @ np.vstack((np.ones((1, a[l].shape[1])), a[l])).T
            # Derivative for the previous layer
            delta = self.W[l][:, 1:].T @ delta * sigmoid_derivative(a[l])

        return grad

    def train(self, x, yBar, lr=0.5, epochs=80, tol=1e-3):
        """ Train the neural network """
        for ep in range(epochs):
            # With the current weights, calculate the output
            a = self.forward(x)
            # Calculate the gradient with backward propagation
            grad = self.backward(yBar, a)
            # Update weights
            self.W -= lr * grad

            # Calculate the error and check if it is below the tolerance
            e = MSE(yBar, a[-1])
            print(f"Epoch {ep} error: {e}")
            if e < tol:
                break

    def predict(self, x):
        return self.forward(x)[-1]


if __name__ == "__main__":
    # -------------- Test 1 (XOR) ---------------- #
    nn = NeuralNetwork([2, 2, 1])
    inputs = np.array([[0, 0, 1, 1],
                       [0, 1, 0, 1]])
    outputs = np.array([[0, 1, 1, 0]])

    # -------------- Test 2 ---------------- #
    # nn = NeuralNetwork([3, 5, 7, 2])
    # inputs = np.array([[2],
    #                    [1],
    #                    [4]])
    # outputs = np.array([[0.5],
    #                     [0.7]])

    # -------------- Train ---------------- #
    nn.train(inputs, outputs, lr=1.5, epochs=10000, tol=1e-3)
    print("Predict:\n", nn.predict(x=inputs))
Training
The neural network is trained by repeatedly running forward and backward propagation over the training set and updating the weights by gradient descent, until the error falls below the tolerance or the maximum number of epochs is reached. Using the XOR problem as an example, the algorithm yields the following results:
...
Epoch 9987 error: 0.0031167375281244422
Epoch 9988 error: 0.003948532289816238
Epoch 9989 error: 0.003114471626569108
Epoch 9990 error: 0.003945706096179238
Epoch 9991 error: 0.003112207999681534
Epoch 9992 error: 0.003942882387249255
Epoch 9993 error: 0.003109946644774476
Epoch 9994 error: 0.00394006116001136
Epoch 9995 error: 0.0031076875591646326
Epoch 9996 error: 0.003937242411456609
Epoch 9997 error: 0.0031054307401727974
Epoch 9998 error: 0.003934426138579485
Epoch 9999 error: 0.0031031761851236543
Predict:
[[0.06200623 0.96272827 0.96272827 0.03521488]]
For an input of $\begin{bmatrix} 0 & 0 & 1 & 1 \\ 0 & 1 & 0 & 1 \end{bmatrix}$, the predictions are close to the expected XOR outputs $\begin{bmatrix} 0 & 1 & 1 & 0 \end{bmatrix}$.
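If hard 0/1 labels are wanted instead of these values, one option (not part of the gist itself) is to threshold the predictions at 0.5, reusing the `nn` and `inputs` objects defined in the `__main__` block above:

```python
# Hypothetical post-processing: threshold the sigmoid outputs at 0.5
labels = (nn.predict(inputs) > 0.5).astype(int)
print(labels)  # for a run like the one above this gives [[0 1 1 0]]
```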
Neural network
The objective of this gist is to implement a fully-connected neural network from scratch and train it with backpropagation.
Forward propagation
To compute the output of the neural network, we need to compute the output of each layer. The output of a layer is obtained by applying the activation function to the weighted sum of its inputs. The output of one layer is the input of the next layer, and the output of the last layer is the output of the network.
To achieve that, it is necessary to define a convention for the inputs, outputs, and weights of each layer. The output of each layer is a vector of size $n_l$, where $n_l$ is the number of neurons in layer $l$.
Now, let's define the weighted sum $z_l$. Due to the convention, the input of layer $l$ is the output of layer $l-1$, so the weight matrix $W_l$ has size $n_l \times n_{l-1}$. To include the bias in the same matrix, a row of ones is prepended to the input, so the dimension of the weight matrix becomes $n_l \times (n_{l-1}+1)$:
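$$z_l = W_l \begin{bmatrix} 1 \\ a_{l-1} \end{bmatrix}, \qquad a_l = \sigma(z_l) = \frac{1}{1 + e^{-z_l}}$$

This is what the `forward` method computes: `np.vstack` prepends the row of ones and `self.W[l-1] @ ...` performs the weighted sum (the index is `l-1` only because Python numbers the weight matrices from 0).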
With the above equations, we can now define the forward propagation algorithm.
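The following is a minimal, standalone sketch that mirrors the `forward` method of the gist; the 2-2-1 layer sizes, the random weights, and the sample inputs are only illustrative:

```python
import numpy as np

def sigmoid(x):
    return 1 / (1 + np.exp(-x))

# Illustrative 2-2-1 network: one weight matrix per layer, with an extra bias column
L = [2, 2, 1]
W = [np.random.rand(L[i+1], L[i] + 1) for i in range(len(L) - 1)]

x = np.array([[0, 0, 1, 1],
              [0, 1, 0, 1]])  # one column per sample

a = x
for Wl in W:
    z = Wl @ np.vstack((np.ones((1, a.shape[1])), a))  # weighted sum with bias row
    a = sigmoid(z)                                      # activation of the layer

print(a.shape)  # (1, 4): one output value per sample
```

Each column of `x` is one sample, so the whole batch is propagated with a single matrix product per layer.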
Backpropagation
The backpropagation algorithm is used to compute the gradient of the loss function with respect to the weights of the neural network. The gradient is used to update the weights of the neural network in order to minimize the loss function.
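In the `train` method this gradient is applied with plain gradient descent: with learning rate $\eta$ (`lr` in the code), each weight matrix is updated as

$$W_l \leftarrow W_l - \eta \, \frac{\partial E}{\partial W_l}$$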
First, we need to define the loss function. The loss function is used to measure the error of the neural network. In this gist, we will use the mean squared error function:
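$$E(\bar{y}, y) = \frac{1}{2} \sum_{k} \left(\bar{y}_k - y_k\right)^2$$

where $\bar{y}$ is the target output and $y = a_L$ is the output of the last layer, so that $\frac{\partial E}{\partial y} = y - \bar{y}$ (the `MSE` and `MSE_derivative` functions in the code).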
The gradient of the loss function with respect to the weights of the neural network is computed by the chain rule:
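$$\frac{\partial E}{\partial W_l} = \frac{\partial E}{\partial a_l} \, \frac{\partial a_l}{\partial z_l} \, \frac{\partial z_l}{\partial W_l} = \delta_l \begin{bmatrix} 1 \\ a_{l-1} \end{bmatrix}^{T}, \qquad \delta_l = \frac{\partial E}{\partial a_l} \odot \sigma'(z_l)$$

where $\odot$ denotes the element-wise product and, for the sigmoid, $\sigma'(z_l) = a_l \odot (1 - a_l)$.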
With those derivatives, it only remains to compute the gradient of the loss function with respect to the output of each layer, $\frac{\partial E}{\partial a_l}$. To do that, the chain rule can be applied again:
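$$\frac{\partial E}{\partial a_l} = \left(\frac{\partial z_{l+1}}{\partial a_l}\right)^{T} \frac{\partial E}{\partial z_{l+1}} = \hat{W}_{l+1}^{T} \left(\frac{\partial E}{\partial a_{l+1}} \odot \sigma'(z_{l+1})\right)$$

where $\hat{W}_{l+1}$ is $W_{l+1}$ without its bias column (`self.W[l][:, 1:]` in the code).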
As can be seen, the term $\frac{\partial E}{\partial a_{l+1}}$ is the gradient of the loss function with respect to the output of the next layer, so the computation is recursive and, in terms of the $\delta_l$ defined above, may be written as:
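$$\delta_L = (y - \bar{y}) \odot \sigma'(z_L), \qquad \delta_l = \left(\hat{W}_{l+1}^{T} \, \delta_{l+1}\right) \odot \sigma'(z_l), \quad l = L-1, \dots, 1$$

where $L$ is the index of the last layer. The gradient of each layer is then $\frac{\partial E}{\partial W_l} = \delta_l \begin{bmatrix} 1 \\ a_{l-1} \end{bmatrix}^{T}$, which is exactly the recursion implemented in the `backward` method.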
Finally, the complete algorithm combines these pieces: compute the activations with a forward pass, compute the deltas and gradients with a backward pass, and update the weights.
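Here is a minimal, self-contained sketch of that loop. It mirrors the `backward` and `train` methods above; the 2-2-1 layout, the XOR data, and the learning rate match the gist, while the stopping criterion and variable names are only illustrative:

```python
import numpy as np

def sigmoid(x):
    return 1 / (1 + np.exp(-x))

# Illustrative 2-2-1 network for XOR; the weights start random
L = [2, 2, 1]
W = [np.random.rand(L[i+1], L[i] + 1) for i in range(len(L) - 1)]

x = np.array([[0, 0, 1, 1],
              [0, 1, 0, 1]])
yBar = np.array([[0, 1, 1, 0]])
lr = 1.5

for ep in range(10000):
    # Forward pass: store every layer's activation
    a = [x]
    for Wl in W:
        a.append(sigmoid(Wl @ np.vstack((np.ones((1, x.shape[1])), a[-1]))))

    # Backward pass: delta of the output layer, then propagate it backwards
    delta = (a[-1] - yBar) * a[-1] * (1 - a[-1])
    for l in range(len(W) - 1, -1, -1):
        grad = delta @ np.vstack((np.ones((1, x.shape[1])), a[l])).T
        delta = W[l][:, 1:].T @ delta * a[l] * (1 - a[l])  # delta for layer l
        W[l] -= lr * grad                                  # gradient descent update

    error = 0.5 * np.sum((yBar - a[-1])**2)
    if error < 1e-3:
        break

print(f"epochs: {ep + 1}, final error: {error}")
```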