# Skip to content
#
# Instantly share code, notes, and snippets.
#
# @flxh
# flxh / sac.py
# Last active January 31, 2019 21:05
# Soft Actor-Critic (SAC)
import tensorflow as tf
import tensorflow_probability as tfp
import gym
from collections import deque
from random import sample
import numpy as np
from datetime import datetime
# Free-form text label for this run.
# NOTE(review): presumably used to tag logs/output of a run — confirm against its usage.
COMMENT = 'comment'
# NOTE(review): looks like a gradient-clipping norm threshold — confirm where it is consumed.
GRADIENT_NORM = 5