@kaniblu
Last active September 1, 2021 13:19
Masked Softmax in PyTorch
import torch
import torch.nn as nn


class MaskedSoftmax(nn.Module):
    def __init__(self):
        super(MaskedSoftmax, self).__init__()
        self.softmax = nn.Softmax(dim=1)

    def forward(self, x, mask=None):
        """
        Performs masked softmax, as simply masking post-softmax can be
        inaccurate.

        :param x: [batch_size, num_items]
        :param mask: [batch_size, num_items], 1 for valid items, 0 for masked items
        :return: [batch_size, num_items], rows sum to 1 over the valid items
        """
        if mask is not None:
            mask = mask.float()
            # 1 - 1 / mask is 0 where mask == 1 and -inf where mask == 0,
            # so masked positions are pushed to -inf before the max is taken.
            x_masked = x * mask + (1 - 1 / mask)
        else:
            x_masked = x
        # Subtract the per-row max of the masked input for numerical stability.
        x_max = x_masked.max(1)[0]
        x_exp = (x - x_max.unsqueeze(-1)).exp()
        if mask is not None:
            # Zero out the exponentials of masked positions so they do not
            # contribute to the normalizing sum.
            x_exp = x_exp * mask
        return x_exp / x_exp.sum(1).unsqueeze(-1)
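A quick usage sketch (my addition, not part of the original gist): the last item of the second row is masked out, so it receives exactly zero probability and the row renormalizes over the remaining items.

import torch

softmax = MaskedSoftmax()
x = torch.tensor([[1.0, 2.0, 3.0],
                  [1.0, 2.0, 3.0]])
mask = torch.tensor([[1, 1, 1],
                     [1, 1, 0]])
probs = softmax(x, mask)
# Row 0 is an ordinary softmax over all three items;
# row 1 distributes its mass over the first two items only, and each row sums to 1.
print(probs)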
@kaniblu

kaniblu commented Nov 21, 2019

@jiangnanhugo yes, it was a trick to create infinite values back in the day. Nowadays we have masked_fill, which is a better solution.
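For reference, a minimal sketch of the masked_fill approach mentioned above (the function name and signature are illustrative, not from the gist):

import torch

def masked_softmax(x, mask, dim=-1):
    # Fill masked-out positions with -inf before the softmax so that
    # exp(-inf) == 0 and they receive zero probability.
    x = x.masked_fill(mask == 0, float("-inf"))
    return torch.softmax(x, dim=dim)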

@cabbagecabbage

Hello, I don't understand why mask is multiplied in again at line 26 (x_exp = x_exp * mask.float()). What is the impact of not doing that?

@kaniblu

kaniblu commented Sep 8, 2020 via email

@zimonitrome

Hello, I found this post via Google.

I made a smaller, functional version that works for any tensor shape:

import torch

def masked_softmax(x, mask, **kwargs):
    x_masked = x.clone()
    # Set masked-out positions to -inf so they get zero probability after softmax.
    x_masked[mask == 0] = -float("inf")

    return torch.softmax(x_masked, **kwargs)

If anyone else ever needs it :)
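A quick usage sketch of the functional version above (my addition, not from the comment); it works for arbitrary shapes because the reduction dimension is passed straight through to torch.softmax:

import torch

x = torch.randn(2, 3, 4)
mask = torch.ones(2, 3, 4)
mask[..., -1] = 0  # mask out the last item along the final dimension

probs = masked_softmax(x, mask, dim=-1)
# Masked positions get exactly zero probability, and each slice
# along dim=-1 sums to 1 over the remaining items.
print(probs[..., -1])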
