Skip to content

Instantly share code, notes, and snippets.

View flyman3046's full-sized avatar

Fei Zheng flyman3046

View GitHub Profile
@flyman3046
flyman3046 / es-CartPole.py
Last active February 6, 2020 06:08
Implementation of Evolution Strategies to Solve CartPole-v0
# https://gist.github.com/karpathy/77fbb6a8dac5395f1b73e7a89300318d
import gym
import numpy as np
def f(env, weight):
total_reward = 0.0
num_run = 100
for t in range(num_run):
observation = env.reset()
for i in range(300):
@flyman3046
flyman3046 / tensorflow-sim-data.py
Created March 26, 2017 23:56
Used tensorflow to solve a simulated data classification
# Simulated data and plot comes from: http://cs231n.github.io/neural-networks-case-study/
import tensorflow as tf
import numpy as np
import random
import matplotlib.pyplot as plt
plt.rcParams['figure.figsize'] = (10.0, 8.0) # set default size of plots
plt.rcParams['image.interpolation'] = 'nearest'
plt.rcParams['image.cmap'] = 'gray'
@flyman3046
flyman3046 / pg-CartPole-tensorflow.py
Last active March 21, 2017 00:32
Solve CartPole with tensorflow
# Solve CartPole-v0
import tensorflow as tf
import numpy as np
import gym
import matplotlib.pyplot as plt
# hyperparameters
H = 10 # number of hidden layer neurons
learning_rate = 1e-3
@flyman3046
flyman3046 / pg-CartPole-baseline.py
Created March 10, 2017 05:01
Solve CartPole with policy gradient with advantage
# original code: https://github.com/kvfrans/openai-cartpole/blob/master/cartpole-policygradient.py
import tensorflow as tf
import numpy as np
import random
import gym
import math
import matplotlib.pyplot as plt
def softmax(x):
# Original code from https://gist.github.com/karpathy/a4166c7fe253700972fcbc77e4ea32c5
# Use it to solve MountainCar-v0
import numpy as np
import gym
import matplotlib.pyplot as plt
# hyperparameters
H = 10 # number of hidden layer neurons
batch_size = 1 # every how many episodes to do a param update?
@flyman3046
flyman3046 / pg-CartPole-MultiProb.py
Last active March 2, 2017 21:15
Use the standard one-hot encoding
# Original code from https://gist.github.com/karpathy/a4166c7fe253700972fcbc77e4ea32c5
# Use it to solve CartPole-v0
import numpy as np
import gym
# hyperparameters
H = 10 # number of hidden layer neurons
batch_size = 5 # every how many episodes to do a param update?
learning_rate = 1e-3
gamma = 0.99 # discount factor for reward
@flyman3046
flyman3046 / pg-CartPole.py
Last active February 17, 2017 06:38
Policy Gradient to solve CartPole-v0 in OpenAI gym
# Original code from https://gist.github.com/karpathy/a4166c7fe253700972fcbc77e4ea32c5
# Use it to solve CartPole-v0
import numpy as np
import gym
# hyperparameters
H = 10 # number of hidden layer neurons
batch_size = 5 # every how many episodes to do a param update?
learning_rate = 1e-2
gamma = 0.99 # discount factor for reward