Linear Regression - Batch GD
'''
NORMAL EQUATION
'''
import numpy as np

# generate 500 random values for the independent variable
X = 5 * np.random.rand(500, 1)
# generate a linearly related target variable (plus Gaussian noise)
# in the form y = 10 + 2x + noise
y = 10 + 2 * X + np.random.randn(500, 1)
# prepend a column of ones to X (the bias feature, X0 = 1, for each observation)
X_2d = np.c_[np.ones((500, 1)), X]
# closed-form theta that minimizes the MSE via the Normal Equation:
# theta = (X^T X)^-1 X^T y
theta_best = np.linalg.inv(X_2d.T.dot(X_2d)).dot(X_2d.T).dot(y)
print('Normal Equation:\n', theta_best)
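# (assumed addition, not in the original gist) cross-check the closed-form
# solution with NumPy's SVD-based least-squares solver, which avoids
# explicitly inverting X_2d.T.dot(X_2d) and is more numerically stable
theta_lstsq, *_ = np.linalg.lstsq(X_2d, y, rcond=None)
print('np.linalg.lstsq:\n', theta_lstsq)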
'''
BATCH GRADIENT DESCENT
'''
# set the learning rate
eta = 0.1
# maximum number of iterations for GD to try to converge in
n_iterations = 1000
# number of observations in the training data X
m = 500
# random initialization of the parameter vector
theta = np.random.randn(2, 1)
# at each iteration, step against the gradient of the MSE over the full
# batch, which is (2/m) * X^T (X theta - y)
for iteration in range(n_iterations):
    gradients = 2/m * X_2d.T.dot(X_2d.dot(theta) - y)
    theta = theta - eta * gradients
# print the learned theta values
print('Batch GD:\n', theta)
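As a final sanity check (an assumed addition, not part of the original gist), scikit-learn's LinearRegression can be fit on the raw X; it estimates its own intercept, so all approaches should land close to the true parameters of 10 and 2, up to the injected noise.

'''
SKLEARN CROSS-CHECK (assumed addition, not in the original gist)
'''
from sklearn.linear_model import LinearRegression

# fit on the raw X (without the ones column); LinearRegression
# adds its own intercept term by default
lin_reg = LinearRegression()
lin_reg.fit(X, y)
print('sklearn intercept and slope:\n', lin_reg.intercept_, lin_reg.coef_)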