Last active April 12, 2021 02:26
# inspired by the post:
# tl;dr
# If you are using the numpy random generator inside PyTorch `DataLoader` workers,
# you might get identical results across different workers or across epochs.
# Disclaimer: this might not be the best choice, since keeping workers persistent requires additional RAM.
# Any ideas are welcome.
# Here's a simple fix with torch>=1.7.0
# See the original example here:
{"0": "tench", "1": "goldfish", "2": "great white shark", "3": "tiger shark", "4": "hammerhead", "5": "electric ray", "6": "stingray,", "7": "cock,", "8": "hen,", "9": "ostrich", "10": "brambling", "11": "goldfinch", "12": "house finch", "13": "junco", "14": "indigo bunting", "15": "robin", "16": "bulbul,", "17": "jay,", "18": "magpie,", "19": "chickadee,", "20": "water ouzel", "21": "kite,", "22": "bald eagle", "23": "vulture,", "24": "great grey owl", "25": "European fire salamander", "26": "common newt", "27": "eft,", "28": "spotted salamander", "29": "axolotl", "30": "bullfrog", "31": "tree frog", "32": "tailed frog", "33": "loggerhead", "34": "leatherback turtle", "35": "mud turtle,", "36": "terrapin,", "37": "box turtle", "38": "banded gecko,", "39": "common iguana", "40": "American chameleon", "41": "whiptail", "42": "agama,", "43": "frilled lizard", "44": "alligator lizard,", "45": "Gila monster", "46": "green lizard", "47": "African chameleon", "48": "Komodo dragon", "49": "African crocodile", "50":
import imageio
import numpy as np
from utils import *
# Mode selector; the inline note lists the accepted values.
# NOTE(review): presumably picks the update rule used later in the script — confirm.
mode = 'sgd' # sgd, fisher, or dig_fisher
# Fetch the train/test inputs (X_*) and targets (t_*).
# NOTE(review): get_data is not defined here; presumably it comes from the `utils` star import — confirm.
X_train, X_test, t_train, t_test = get_data()
# Obtain the model object W.
# NOTE(review): get_model is likewise assumed to come from `utils` — confirm.
W = get_model()
import torch
import imageio
import numpy as np
import seaborn
import matplotlib.pyplot as plt
import matplotlib
# data generation: y = ax + b
Simple LSTM cell with LayerNorm
# using pytorch==0.4.0
import math
import torch
import torch.nn as nn
import torch.nn.functional as F
from torch.nn.parameter import Parameter
from torch.nn.modules.rnn import RNNCellBase
from torch.nn._functions.thnn import rnnFusedPointwise as fusedBackend
import argparse
import gym
import numpy as np
from itertools import count
from collections import namedtuple, deque
import torch
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim
Since each algorithm in baselines is structured differently, we implement the sample/load function in a different way for each.
# code located in baselines/gail
def sample(algo, load_model_path, policy_fn):
assert algo in ['trpo', 'ppo', 'acktr', 'ddpg', 'a2c']
if algo in ['trpo', 'ppo']:
with tf.Session() as sess:
# manually build graph
policy = policy_fn()
# load model
Since each algorithm in baselines is structured differently, we implement the save function in a different way for each.
# for model in `trpo_mpi`, `ppo`
class CnnPolicy():
def __init__():
# build graph
_ = conv2d()
_ = conv2d()
def step():, feed_dict)
Implement the noisy cross-entropy method for RL
# modified from
import gym
import numpy as np
import matplotlib.pyplot as plt
# Create the 'CartPole-v0' environment through gym.make.
env = gym.make('CartPole-v0')
# Vector of means (mu) and standard deviations (sigma) for each parameter