Skip to content

Instantly share code, notes, and snippets.

@weicheng113
weicheng113 / actor_critic1.py
Created March 20, 2018 03:20
Batched actor-critic with n-step TD
import gym
import itertools
import numpy as np
import tensorflow as tf
import tensorflow.contrib.slim as slim
from gym import wrappers
import collections
from DAT257xLab.lib import plotting
from DAT257xLab.lib.running_variance import RunningVariance
@weicheng113
weicheng113 / actor_critic.py
Last active March 12, 2018 01:04
Actor-critic with n-step TD for CartPole
import gym
import itertools
import numpy as np
import tensorflow as tf
from gym import wrappers
import collections
from DAT257xLab.lib import plotting
from DAT257xLab.lib.running_variance import RunningVariance
@weicheng113
weicheng113 / policy_gradient.py
Last active March 8, 2018 02:40
Simple Monte Carlo policy gradient for CartPole in TensorFlow
import gym
import itertools
import matplotlib
import numpy as np
import tensorflow as tf
import collections
from dennybritz.lib import plotting
matplotlib.style.use('ggplot')