Donal Byrne djbyrne

## DQN Pong Bolts Example.py
from pl_bolts.models.rl.common import wrappers, cli
from pl_bolts.models.rl.dqn_model import DQN

# Build the command-line parser in stages; each step below returns the parser
# that the next step extends. `add_help=False` disables argparse's automatic
# -h/--help option on this parser.
# NOTE(review): `argparse` and `pl` are not imported in the visible lines of
# this snippet — confirm they are imported in the full file.
parser = argparse.ArgumentParser(add_help=False)

# Trainer args: the Trainer adds its options to the parser
parser = pl.Trainer.add_argparse_args(parser)

# Model args: the DQN model adds its own options to the same parser
parser = DQN.add_model_specific_args(parser)

## enlightened_dqn.py
class DQNLightning(pl.LightningModule):
    """Basic DQN Model.

    NOTE(review): only the beginning of ``__init__`` is visible in this
    excerpt; the rest of the class is not shown here.
    """

    def __init__(self, hparams: argparse.Namespace) -> None:
        """Store the hyperparameters and create the training environment.

        Args:
            hparams: parsed arguments; ``hparams.env`` is passed to ``gym.make``
        """
        super().__init__()
        self.hparams = hparams

        self.env = gym.make(self.hparams.env)
        # First entry of the observation space's shape tuple
        obs_size = self.env.observation_space.shape[0]
        # Reads `.n` from the action space — presumably a discrete space; confirm
        n_actions = self.env.action_space.n
        # NOTE(review): obs_size and n_actions are not used within the visible lines

## dqn_agent.py
class Agent:
    """
    Base Agent class handling the interaction with the environment

    Args:
        env: training environment
        replay_buffer: replay buffer storing experiences
    """

    def __init__(self, env: gym.Env, replay_buffer: ReplayBuffer) -> None:

## replay_dataset.py
class RLDataset(IterableDataset):
    """
    Iterable Dataset containing the ReplayBuffer,
    which will be updated with new experiences during training.

    NOTE(review): no methods are visible in this excerpt; the Args below
    presumably describe the constructor — confirm against the full file.

    Args:
        buffer: replay buffer
        sample_size: number of experiences to sample at a time
    """

## replay_buffer.py
# Record type holding one experience step gathered in training:
# (state, action, reward, done, new_state)
Experience = collections.namedtuple(
    'Experience',
    field_names=('state', 'action', 'reward', 'done', 'new_state'),
)

class ReplayBuffer:
    """
    Replay Buffer for storing past experiences allowing the agent to learn from them

    Args:

## dqn_mlp.py
class DQN(nn.Module):
    """
    Simple MLP network.

    NOTE(review): the constructor and forward pass are not visible in this
    excerpt; the Args below presumably describe the constructor — confirm
    against the full file.

    Args:
        obs_size: observation/state size of the environment
        n_actions: number of discrete actions available in the environment
        hidden_size: size of hidden layers
    """


## TD3.ipynb

      
              1 file
            
          
              3 forks
            
          
              0 comments
            
          
              5 stars
            
          
                djbyrne
                / TD3.ipynb
            
            
              Last active
              February 5, 2023 02:02
            
          
      Sorry, something went wrong. Reload?
      Sorry, we cannot display this file.
      Sorry, this file is invalid so it cannot be displayed.
      
          Viewer requires iframe.
      
    
## control.ipynb

      
              1 file
            
          
              1 fork
            
          
              0 comments
            
          
              2 stars
            
          
                djbyrne
                / control.ipynb
            
            
              Last active
              April 24, 2023 03:26
            
          
      Sorry, something went wrong. Reload?
      Sorry, we cannot display this file.
      Sorry, this file is invalid so it cannot be displayed.
      
          Viewer requires iframe.
      
    
## prediction.ipynb

      
              1 file
            
          
              1 fork
            
          
              2 comments
            
          
              3 stars
            
          
                djbyrne
                / prediction.ipynb
            
            
              Last active
              May 3, 2023 01:16
            
          
      Sorry, something went wrong. Reload?
      Sorry, we cannot display this file.
      Sorry, this file is invalid so it cannot be displayed.
      
          Viewer requires iframe.
	from pl_bolts.models.rl.common import wrappers, cli
	from pl_bolts.models.rl.dqn_model import DQN

	parser = argparse.ArgumentParser(add_help=False)

	# Trainer args
	parser = pl.Trainer.add_argparse_args(parser)

	# Model args
	parser = DQN.add_model_specific_args(parser)
	class DQNLightning(pl.LightningModule):
	""" Basic DQN Model """

	def __init__(self, hparams: argparse.Namespace) -> None:
	super().__init__()
	self.hparams = hparams

	self.env = gym.make(self.hparams.env)
	obs_size = self.env.observation_space.shape[0]
	n_actions = self.env.action_space.n
	class Agent:
	"""
	Base Agent class handling the interaction with the environment

	Args:
	env: training environment
	replay_buffer: replay buffer storing experiences
	"""

	def __init__(self, env: gym.Env, replay_buffer: ReplayBuffer) -> None:
	class RLDataset(IterableDataset):
	"""
	Iterable Dataset containing the ReplayBuffer
	which will be updated with new experiences during training

	Args:
	buffer: replay buffer
	sample_size: number of experiences to sample at a time
	"""
	# Named tuple for storing experience steps gathered in training
	Experience = collections.namedtuple(
	'Experience', field_names=['state', 'action', 'reward',
	'done', 'new_state'])

	class ReplayBuffer:
	"""
	Replay Buffer for storing past experiences allowing the agent to learn from them

	Args:
	class DQN(nn.Module):
	"""
	Simple MLP network

	Args:
	obs_size: observation/state size of the environment
	n_actions: number of discrete actions available in the environment
	hidden_size: size of hidden layers
	"""