Skip to content

Instantly share code, notes, and snippets.

Last active January 1, 2019 22:01
Show Gist options
  • Save yanfengliu/9f32a0508ddebd41d32f61c2a7338056 to your computer and use it in GitHub Desktop.
Save yanfengliu/9f32a0508ddebd41d32f61c2a7338056 to your computer and use it in GitHub Desktop.
Solving inverse kinematics with a neural network, assuming a 2D environment and a robot arm with 2 segments, each of length 1.
import keras
import numpy as np
from keras.models import Sequential, Model
from keras.layers import Dense, Activation, LeakyReLU, Input, Lambda, Concatenate
from keras.losses import mean_absolute_error, mean_squared_error
import os
import sys
%matplotlib inline
import matplotlib.pyplot as plt
from keras import optimizers
from keras import metrics
import tensorflow as tf
import keras.backend as K
from IPython.display import clear_output
import math
def transform_matrix(theta, d, a, alpha):
    """Return the 4x4 homogeneous Denavit-Hartenberg transform of one link.

    Args:
        theta: rotation about the z axis, in radians.
        d: offset along the z axis.
        a: link length (offset along the rotated x axis).
        alpha: twist about the x axis, in radians.

    Returns:
        A ``(4, 4)`` NumPy array.
    """
    # Evaluate each trig term once instead of repeating it in every cell.
    cos_t, sin_t = np.cos(theta), np.sin(theta)
    cos_a, sin_a = np.cos(alpha), np.sin(alpha)
    return np.array([
        [cos_t, -sin_t * cos_a, sin_t * sin_a, a * cos_t],
        [sin_t, cos_t * cos_a, -cos_t * sin_a, a * sin_t],
        [0, sin_a, cos_a, d],
        [0, 0, 0, 1],
    ])
def forward_kinematics_2(theta1, theta2):
    """Compute forward kinematics of a planar arm with two unit-length links.

    Args:
        theta1: angle of the first joint, in radians.
        theta2: angle of the second joint relative to the first link, in radians.

    Returns:
        A tuple ``(T00, T01, Etip)`` where ``T00`` and ``T01`` are the 4x4
        transforms of the first and second link, and ``Etip`` is the
        homogeneous position (length-4 vector) of the end of the second link,
        i.e. ``T00 @ T01 @ [0, 0, 0, 1]``.
    """
    # Both links use d=0, a=1, alpha=0: planar motion with unit link length.
    T00 = transform_matrix(theta1, 0, 1, 0)
    T01 = transform_matrix(theta2, 0, 1, 0)
    origin = [0, 0, 0, 1]
    Etip = np.matmul(np.matmul(T00, T01), origin)
    return T00, T01, Etip
def get_positions_2(theta):
    """Return the xy positions of both link ends for a 2-link arm.

    Args:
        theta: indexable holding the two joint angles, already in radians
            (``theta[0]`` for the first joint, ``theta[1]`` for the second).

    Returns:
        A NumPy array of shape ``(2, 2, 1)``: index 0 is the end of the first
        link, index 1 is the end of the second link; each entry is an xy
        column vector.
    """
    theta1, theta2 = theta[0], theta[1]
    # The second link's own transform is not needed here, only the tip.
    T00, _, Etip = forward_kinematics_2(theta1, theta2)
    origin_col = np.transpose(np.array([[0, 0, 0, 1]]))
    pos_1 = np.matmul(T00, origin_col)
    # Keep only the first two homogeneous coordinates (x and y).
    return np.array([pos_1[:2], np.reshape(Etip[:2], (2, 1))])
def transform_matrix_tensor(theta, d, a, alpha):
    """Build the link transform from tensors (TensorFlow twin of transform_matrix).

    Args:
        theta: tensor of rotations about z, in radians.
        d: tensor of offsets along z.
        a: tensor of link lengths.
        alpha: tensor of twists about x, in radians.

    Returns:
        A 4x4 nested Python list whose entries are tensors; it is not stacked
        into a single tensor here. Entries are element-wise in the inputs, so
        every argument is expected to share ``theta``'s shape.
    """
    # Create each trig op once and reuse it across the matrix cells.
    cos_t, sin_t = tf.cos(theta), tf.sin(theta)
    cos_a, sin_a = tf.cos(alpha), tf.sin(alpha)
    zero = tf.zeros_like(theta)
    one = tf.ones_like(theta)
    matrix = [
        [cos_t, tf.multiply(-sin_t, cos_a), tf.multiply(sin_t, sin_a), tf.multiply(a, cos_t)],
        [sin_t, tf.multiply(cos_t, cos_a), tf.multiply(-cos_t, sin_a), tf.multiply(a, sin_t)],
        [zero, sin_a, cos_a, d],
        [zero, zero, zero, one],
    ]
    return matrix
def batch_matmul(location_v, batch_theta_v):
    """Apply a unit-link transform to one homogeneous point per batch example.

    The matrix-vector product is done for the whole batch at once with an
    element-wise multiply followed by a sum over the column axis.

    Args:
        location_v: homogeneous points tiled as built in
            forward_kinematics_loss_2, i.e. ``location_v[k, j, b]`` holds
            coordinate ``j`` of example ``b`` for every row ``k``.
        batch_theta_v: 1-D tensor with one joint angle (radians) per example.

    Returns:
        Tensor of shape ``(batch, 4)`` with the transformed homogeneous points.
    """
    zeros = tf.zeros_like(batch_theta_v)
    ones = tf.ones_like(batch_theta_v)
    # d=0, a=1, alpha=0: planar link of length 1.
    transform = transform_matrix_tensor(batch_theta_v, zeros, ones, zeros)
    # The nested list is packed into a (4, 4, batch) tensor by tf.multiply;
    # cell [i, j, b] becomes M[i, j] * v[j] for example b.
    product = tf.multiply(transform, location_v)
    # Summing over j completes the matrix-vector product -> (4, batch).
    product = tf.reduce_sum(product, axis=1)
    return tf.transpose(product)
def forward_kinematics_loss_2(y_true, y_pred):
    """Keras loss: position error of the arm tip plus a joint-limit penalty.

    Args:
        y_true: tensor of target xy positions, shape ``(batch, 2)``.
        y_pred: tensor of predicted joint angles ``(theta1, theta2)`` in
            radians, shape ``(batch, 2)``.

    Returns:
        Scalar tensor: mean squared xy error of the tip reached by ``y_pred``
        plus the mean amount by which ``|theta1|`` exceeds pi and ``|theta2|``
        exceeds pi / 2.
    """
    theta1 = y_pred[:, 0]
    theta2 = y_pred[:, 1]

    def tile_for_batch_matmul(points):
        # (batch, 4) -> (4, 4, batch): repeat each point once per matrix row,
        # which is the layout batch_matmul multiplies element-wise.
        tiled = K.expand_dims(points, axis=-1)
        tiled = K.concatenate([tiled] * 4, axis=2)
        return tf.transpose(tiled, perm=[2, 1, 0])

    # Homogeneous origin [0, 0, 0, 1] for every example in the batch.
    zeros = K.expand_dims(tf.zeros_like(theta1), axis=1)
    origin = K.concatenate([zeros, zeros, zeros, zeros + 1], axis=1)

    # The tip is T(theta1) @ T(theta2) @ origin, matching forward_kinematics_2,
    # so the second link's transform must be applied first and the first
    # link's transform last. Applying them in the opposite order yields
    # cos(theta1 + theta2) + cos(theta2) instead of
    # cos(theta1 + theta2) + cos(theta1) for x (and likewise for y).
    tip_in_first_link_frame = batch_matmul(tile_for_batch_matmul(origin), theta2)
    end_tip = batch_matmul(tile_for_batch_matmul(tip_in_first_link_frame), theta1)

    xy = end_tip[:, :2]
    loss1 = K.mean(K.square(xy - y_true))

    # Penalise angles outside the ranges the training data is sampled from.
    limits = tf.constant([[math.pi, 0.5 * math.pi]], dtype=y_pred.dtype)
    loss2 = K.mean(tf.maximum(tf.abs(y_pred) - limits, 0.0))
    return loss1 + loss2
def get_xy_and_theta_2(num):
    """Sample random joint angles and the tip positions they produce.

    Args:
        num: number of samples to generate.

    Returns:
        A tuple ``(xy, theta)``. ``xy`` has shape ``(num, 2)`` and holds the
        tip position of each sample. ``theta`` has shape ``(num, 3)``:
        column 0 is uniform in [-pi, pi), column 1 is uniform in
        [-pi/2, pi/2), and column 2 is never written and stays zero (kept so
        the returned shape does not change for existing callers).
    """
    xy = np.zeros((num, 2))
    theta = np.zeros((num, 3))
    theta[:, 0] = (np.random.random(num) * 2 * np.pi) - np.pi
    theta[:, 1] = (np.random.random(num) * np.pi) - (0.5 * np.pi)
    for i in range(num):
        _, _, tip = forward_kinematics_2(theta[i, 0], theta[i, 1])
        # tip is homogeneous (x, y, z, 1); keep x and y only.
        xy[i, :] = tip[:2]
    return xy, theta
# Network mapping a target xy position to joint angles.
# NOTE(review): no activation between the Dense layers is visible in this
# copy of the script, so the model is linear as written; LeakyReLU is
# imported but unused -- confirm the intended architecture.
model = Sequential([
    Dense(256, input_shape=(2,)),
    Dense(2),  # <==== Change this to the number of angles predicted
])
adam = optimizers.Adam(lr=1e-6)
# NOTE(review): the compile call was missing from this copy; reconstructed
# from the otherwise unused `adam` optimizer and forward-kinematics loss.
model.compile(optimizer=adam, loss=forward_kinematics_loss_2)

loss_hist = []
error_hist = []
EPOCHS = 100000
xy_test, theta_test = get_xy_and_theta_2(10000)

for epoch in range(EPOCHS):
    # train on a mini-batch
    print("epoch {}".format(epoch))
    xy_train, theta_train = get_xy_and_theta_2(100)
    # The loss compares the position reached by the predicted angles with
    # y_true, so the xy positions serve as both input and target.
    history = model.fit(xy_train, xy_train, epochs=1, batch_size=1, verbose=1)
    loss_hist.append(history.history['loss'][0])

    # test the model on the test set
    theta_pred = model.predict(xy_test)
    xy_pred = np.array([get_positions_2(angles)[1, :, 0] for angles in theta_pred])
    error = np.mean(np.square(xy_pred - xy_test))
    error_hist.append(error)

    # NOTE(review): per-epoch plotting is assumed from the notebook-style
    # imports (clear_output); confirm against the original notebook.
    clear_output(wait=True)

    # plot (1) loss & (2) mean square error on test set, vs. training steps
    plt.figure(figsize=(16, 4))
    line1, = plt.plot(error_hist, label="error hist")
    line2, = plt.plot(loss_hist, label="loss hist")
    plt.title('mean squared error on test set vs. epoch')
    plt.legend((line1, line2), ('error hist', 'loss hist'))

    # randomly showcase 12 examples to visually see how the network is doing
    xy_temp, theta_temp = get_xy_and_theta_2(12)
    theta_show = model.predict(xy_temp)
    fig, ax = plt.subplots(nrows=3, ncols=4, figsize=(16, 12))
    for idx, col in enumerate(ax.flat):
        # plot xy from predicted angles and ground truth, for 2-segment arm
        # Drop the trailing length-1 axis so plot() receives plain scalars.
        joints = get_positions_2(theta_show[idx])[:, :, 0]
        elbow, tip = joints[0], joints[1]
        col.plot([0, elbow[0]], [0, elbow[1]])
        col.plot([elbow[0], tip[0]], [elbow[1], tip[1]])
        col.plot(xy_temp[idx][0], xy_temp[idx][1], 'bo', markersize=10)
        col.plot(tip[0], tip[1], 'ro', markersize=10)
        col.set_xlim([-3, 3])
        col.set_ylim([-3, 3])
    plt.show()
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment