Skip to content

Instantly share code, notes, and snippets.

Created January 20, 2017 00:35
Show Gist options
  • Save anonymous/5fc9903990ecec5f09361934920bb999 to your computer and use it in GitHub Desktop.
Save anonymous/5fc9903990ecec5f09361934920bb999 to your computer and use it in GitHub Desktop.
import numpy as np
import tensorflow as tf
class RNN_config(object):
    """Hyperparameters read by ``setup_graph`` when it builds the RNN graph.

    The class attributes hold the default values; the constructor stores
    per-instance overrides for any of them.

    Args:
        num_steps: number of per-step tensors the inputs and labels are
            split into along axis 1.
        state_size: width of the RNN state vector.
        batch_size: first dimension of the input, label and state
            placeholders.
        num_classes: depth of the one-hot encoding used for inputs and
            labels, and width of the softmax output.
        learning_rate: learning rate handed to the optimizer.
    """

    # Class-level defaults, kept so ``RNN_config.<name>`` keeps working.
    num_steps = 5
    batch_size = 200
    num_classes = 2
    state_size = 4
    learning_rate = 0.1

    def __init__(self, num_steps=5, state_size=4, batch_size=200,
                 num_classes=2, learning_rate=0.1):
        # The first two parameters keep their original position and
        # defaults; the rest are appended so existing callers are unaffected.
        self.num_steps = num_steps
        self.state_size = state_size
        self.batch_size = batch_size
        self.num_classes = num_classes
        self.learning_rate = learning_rate
def setup_graph(graph, config):
    """Build a simple RNN training graph inside ``graph``.

    Args:
        graph: graph object; all ops are created under its
            ``as_default()`` context.
        config: object providing ``batch_size``, ``num_steps``,
            ``num_classes``, ``state_size`` and ``learning_rate``
            (for example an ``RNN_config`` instance).

    Returns:
        A tuple ``(losses, total_loss, final_state, train_step, x, y,
        init_state)`` where
        ``losses`` is a list with one cross-entropy tensor per step,
        ``total_loss`` is the mean over ``losses``,
        ``final_state`` is the RNN state after the last step,
        ``train_step`` is the Adagrad minimize op for ``total_loss``,
        ``x`` / ``y`` are the int32 input / label placeholders, and
        ``init_state`` is the initial-state placeholder (defaults to zeros).
    """
    # NOTE(review): tf.split / tf.concat below take the axis as their first
    # argument, which looks like the pre-1.0 TensorFlow signature -- confirm
    # against the installed version before upgrading.
    with graph.as_default():
        x = tf.placeholder(tf.int32, [config.batch_size, None],
                           name='input_placeholder')
        y = tf.placeholder(tf.int32, [config.batch_size, None],
                           name='labels_placeholder')
        default_init_state = tf.zeros([config.batch_size, config.state_size])
        init_state = tf.placeholder_with_default(
            default_init_state,
            [config.batch_size, config.state_size],
            name='state_placeholder')

        # --- rnn_inputs and y_as_list ---
        # Turn our x placeholder into a list of one-hot tensors:
        # 1. tf.split creates a list of config.num_steps tensors, each with
        #    shape [batch_size X 1 X num_classes]
        # 2. tf.squeeze gets rid of the middle dimension from each
        # 3. Thus, rnn_inputs is a list of config.num_steps tensors with
        #    shape [batch_size, num_classes]
        x_one_hot = tf.one_hot(x, config.num_classes)
        rnn_inputs = [tf.squeeze(i, squeeze_dims=[1])
                      for i in tf.split(1, config.num_steps, x_one_hot)]

        # Turn our y placeholder into a list of one-hot tensors
        y_one_hot = tf.one_hot(y, config.num_classes)
        y_as_list = [tf.squeeze(i, squeeze_dims=[1])
                     for i in tf.split(1, config.num_steps, y_one_hot)]

        # --- Definition of rnn_cell ---
        # This is very similar to the __call__ method on Tensorflow's
        # BasicRNNCell.
        # Create the cell's variables once here; rnn_cell() then looks them
        # up again with reuse=True so every time step shares the same weights.
        with tf.variable_scope('rnn_cell'):
            tf.get_variable(
                'W',
                [config.num_classes + config.state_size, config.state_size])
            tf.get_variable('b', [config.state_size],
                            initializer=tf.constant_initializer(0.0))

        def rnn_cell(rnn_input, state):
            """Return tanh([rnn_input, state] . W + b) using the shared variables."""
            with tf.variable_scope('rnn_cell', reuse=True):
                W = tf.get_variable(
                    'W',
                    [config.num_classes + config.state_size,
                     config.state_size])
                b = tf.get_variable('b', [config.state_size],
                                    initializer=tf.constant_initializer(0.0))
            return tf.tanh(tf.matmul(tf.concat(1, [rnn_input, state]), W) + b)

        # --- Adding rnn_cells to graph ---
        # This is a simplified version of the "rnn" function from
        # Tensorflow's api.
        state = init_state
        rnn_outputs = []
        for rnn_input in rnn_inputs:
            state = rnn_cell(rnn_input, state)
            # Record every step's state: the logits, the losses and
            # final_state are all derived from this list, so it must not
            # stay empty.
            rnn_outputs.append(state)
        final_state = rnn_outputs[-1]

        # --- Predictions, loss, training step ---
        # Losses and total_loss are similar to the "sequence_loss_by_example"
        # and "sequence_loss" functions, respectively, from Tensorflow's api.

        # logits and predictions
        with tf.variable_scope('softmax'):
            W = tf.get_variable('W', [config.state_size, config.num_classes])
            b = tf.get_variable('b', [config.num_classes],
                                initializer=tf.constant_initializer(0.0))
        logits = [tf.matmul(rnn_output, W) + b for rnn_output in rnn_outputs]
        # Built for parity with the original graph; not part of the return value.
        predictions = [tf.nn.softmax(logit) for logit in logits]

        # losses and train_step
        losses = [tf.nn.softmax_cross_entropy_with_logits(logit, label)
                  for logit, label in zip(logits, y_as_list)]
        total_loss = tf.reduce_mean(losses)
        train_step = tf.train.AdagradOptimizer(
            config.learning_rate).minimize(total_loss)

    return losses, total_loss, final_state, train_step, x, y, init_state
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment