Pavel C PavelCz

## debug_ray_cache.py
"""Simple example of setting up a multi-agent policy mapping.

Control the number of agents and policies via --num-agents and --num-policies.

This works with hundreds of agents and policies, but note that initializing
many TF policies will take some time.

Also, TF evaluation might slow down with a large number of policies. To debug
TF execution, set the TF_TIMELINE_DIR environment variable.
"""

## slow_rllib_init.py
import time

import gym
import ray
from ray.rllib.agents.ppo import PPOTrainer
from ray.rllib.examples.env.multi_agent import MultiAgentCartPole
from ray.tune import register_env

# Initialize Ray with its default settings (no arguments are passed).
ray.init()

## transfer-learning.txt
# Fetch the transfer-learning training data: clone the repository, then move its train/ directory to ./train.
!git clone https://github.com/aditya9898/transfer-learning.git
!mv transfer-learning/train train
	"""Simple example of setting up a multi-agent policy mapping.

	Control the number of agents and policies via --num-agents and --num-policies.

	This works with hundreds of agents and policies, but note that initializing
	many TF policies will take some time.

	Also, TF evaluation might slow down with a large number of policies. To debug
	TF execution, set the TF_TIMELINE_DIR environment variable.
	"""
	import time

	import gym
	import ray
	from ray.rllib.agents.ppo import PPOTrainer
	from ray.rllib.examples.env.multi_agent import MultiAgentCartPole
	from ray.tune import register_env

	# Initialize Ray with its default settings (no arguments are passed).
	ray.init()
	# Fetch the transfer-learning training data: clone the repository, then move its train/ directory to ./train.
	!git clone https://github.com/aditya9898/transfer-learning.git
	!mv transfer-learning/train train