ChunML/text_generation_pt_8.py

## text_generation_pt_8.py
    # Train for a fixed 50 epochs; each epoch iterates over every (x, y) batch.
    for e in range(50):
        # Build this epoch's batches and start from the network's zero state.
        batches = get_batches(in_text, out_text, flags.batch_size, flags.seq_size)
        state_h, state_c = net.zero_state(flags.batch_size)

        # Move both state tensors to `device` (the GPU when `device` is CUDA).
        state_h = state_h.to(device)
        state_c = state_c.to(device)
        for x, y in batches:
            # Running batch counter; it is not reset between epochs here.
            iteration += 1

            # Put the network in training mode.
            net.train()

            # Clear the gradients left over from the previous step.
            optimizer.zero_grad()

            # Wrap the batch in tensors and move them to `device`.
            x = torch.tensor(x).to(device)
            y = torch.tensor(y).to(device)

            # Forward pass: the state carried in from the previous batch is fed
            # to the network and replaced by the state it returns.
            logits, (state_h, state_c) = net(x, (state_h, state_c))
            # Dims 1 and 2 of the logits are swapped before the loss.
            # NOTE(review): assumes logits are (batch, seq, vocab) and that
            # `criterion` expects the class dim at index 1 -- confirm.
            loss = criterion(logits.transpose(1, 2), y)

            # Detach the carried state from this batch's graph so that later
            # backward() calls do not propagate into earlier batches.
            state_h = state_h.detach()
            state_c = state_c.detach()

            # Python-scalar copy of the loss; not read in the lines shown here.
            loss_value = loss.item()

            # Perform back-propagation
            loss.backward()

            # Update the network's parameters
            optimizer.step()
	# NOTE(review): this loop is statement-for-statement the same as the
	# space-indented loop directly above it; its nesting had been flattened to
	# a single tab and is restored here. If the repetition is a paste artifact,
	# keep only one copy -- otherwise training runs 2 x 50 epochs. This copy is
	# tab-indented while the copy above uses spaces; Python rejects mixing the
	# two in one suite, so normalise the indentation when reconciling them.
	#
	# Train for a fixed 50 epochs; each epoch iterates over every (x, y) batch.
	for e in range(50):
		# Build this epoch's batches and start from the network's zero state.
		batches = get_batches(in_text, out_text, flags.batch_size, flags.seq_size)
		state_h, state_c = net.zero_state(flags.batch_size)

		# Move both state tensors to `device` (the GPU when `device` is CUDA).
		state_h = state_h.to(device)
		state_c = state_c.to(device)
		for x, y in batches:
			# Running batch counter; it is not reset between epochs here.
			iteration += 1

			# Put the network in training mode.
			net.train()

			# Clear the gradients left over from the previous step.
			optimizer.zero_grad()

			# Wrap the batch in tensors and move them to `device`.
			x = torch.tensor(x).to(device)
			y = torch.tensor(y).to(device)

			# Forward pass: the state carried in from the previous batch is
			# fed to the network and replaced by the state it returns.
			logits, (state_h, state_c) = net(x, (state_h, state_c))
			# Dims 1 and 2 of the logits are swapped before the loss.
			# NOTE(review): assumes logits are (batch, seq, vocab) and that
			# `criterion` expects the class dim at index 1 -- confirm.
			loss = criterion(logits.transpose(1, 2), y)

			# Detach the carried state from this batch's graph so that later
			# backward() calls do not propagate into earlier batches.
			state_h = state_h.detach()
			state_c = state_c.detach()

			# Python-scalar copy of the loss; not read in the lines shown here.
			loss_value = loss.item()

			# Perform back-propagation
			loss.backward()

			# Update the network's parameters
			optimizer.step()