# Straight-through Gumbel-Softmax sampling of a sequence of discrete messages,
# with every timestep at or after the first "stop" symbol (the last class,
# index output_size - 1) zeroed out.
#
# Assumed to be defined elsewhere:
#   a1_logits:           [batch, num_binary_messages, output_size] logits
#   tau:                 Gumbel-Softmax temperature
#   output_size:         vocabulary size (binary symbols plus a stop symbol)
#   num_binary_messages: maximum message length
import numpy as np
import tensorflow as tf

q_y = tf.contrib.distributions.RelaxedOneHotCategorical(tau, logits=a1_logits)
y = q_y.sample()
y_hard = tf.cast(tf.one_hot(tf.argmax(y, -1), output_size), y.dtype)
# Append a guaranteed stop symbol onto the end of every sequence so that the
# argmax below always finds one and never returns an incorrect index.
one_hot = np.array([0]*(output_size - 1) + [1]).astype(np.float32)
concat_one_hot = tf.expand_dims(tf.expand_dims(tf.convert_to_tensor(one_hot), 0), 0)
concat_one_hot = tf.tile(concat_one_hot, tf.stack([tf.shape(y_hard)[0], 1, 1]))
concat_y_hard = tf.concat([y_hard, concat_one_hot], 1)
# Find the first timestep that predicts the stop symbol (a 2) and zero out
# everything from that timestep onward.
first_zeros = tf.argmax(tf.to_int32(tf.reduce_all(tf.equal(concat_y_hard, one_hot), 2)), 1)
mask = tf.to_float(tf.sequence_mask(first_zeros, num_binary_messages + 1))
# Shift class indices up by one so the mask can send trailing timesteps to 0,
# then shift back down: masked timesteps become -1, which tf.one_hot maps to
# an all-zero vector, while real classes map back to their original indices.
argmax_messages = ((tf.argmax(concat_y_hard, 2) + 1) * tf.to_int64(mask))[:, :num_binary_messages]
y_hard = tf.one_hot(argmax_messages - 1, output_size)
# Straight-through estimator: the forward pass uses the hard one-hot messages
# while the backward pass differentiates through the relaxed sample y.
messages = tf.stop_gradient(y_hard - y) + y
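
# --- Usage sketch (not part of the original gist) ---
# A minimal, hypothetical way to exercise the graph above, assuming binary
# symbols {0, 1} plus a stop symbol 2 (so output_size = 3), a maximum length
# of num_binary_messages = 5, tau = 0.5, and random logits standing in for
# a1_logits, e.g. a1_logits = tf.random_normal([4, num_binary_messages, output_size]).
with tf.Session() as sess:
    sampled = sess.run(messages)
    # sampled has shape [4, num_binary_messages, output_size]; every timestep
    # at or after the first sampled stop symbol is an all-zero row, while
    # gradients still flow through the relaxed sample y.
    print(sampled.shape)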