# piEsposito/global_doom_variables.py

## global_doom_variables.py
# Module-level setup for the training run: hyperparameters, the frame stacker,
# the policy network, the bookkeeping lists, and the TensorBoard graph export.
#
# NOTE: `FrameStacker`, `PolicyNetwork`, `device`, `writer` and `torch` are not
# defined in this section; they must already be in scope when it runs.
#
# The statements below used to appear twice, the second time indented with a
# tab. An indented statement at module level is an IndentationError, and
# running the setup twice would only rebuild the network and log the graph
# again, so a single copy is kept.

# Global hyperparameters.
GAMMA = .95  # presumably the reward discount factor -- confirm in the training loop
EPISODES = 5000  # presumably the number of training episodes -- confirm
learning_rate = 0.01  # forwarded to PolicyNetwork as `lr`

# Our net and frame-stacker.
stacker = FrameStacker()
policy_net = PolicyNetwork(lr=learning_rate).to(device)

# Lists that collect per-run values (filled in elsewhere).
num_steps = []
avg_numsteps = []
all_rewards = []

# Write the network graph to TensorBoard. The example input is an all-zero
# 84x84 frame passed through the stacker, given a leading dimension of size 1
# and moved to the same device as the network.
# NOTE(review): assumes `writer` is a TensorBoard SummaryWriter and that
# `stacker.stack` returns a tensor shaped like a single network input -- confirm.
writer.add_graph(
    policy_net,
    stacker.stack(torch.zeros(84, 84)).unsqueeze(0).to(device),
)