fxia22/gist:85573cced6f268c63d6f9d2a51e1cd83

## gistfile1.txt
from gibson2.core.physics.robot_locomotors import *
from gibson2.core.simulator import Simulator
from gibson2.core.physics.scene import *
import gibson2
from gibson2.utils.utils import parse_config, rotate_vector_3d, l2_distance, quatToXYZW
from gibson2.envs.base_env import BaseEnv
from transforms3d.euler import euler2quat
from collections import OrderedDict
from gibson2.envs.locomotor_env import *
import atexit
import multiprocessing
import sys
import traceback
from tqdm import tqdm
class ParallelNavEnvironment(NavigateEnv):
  """Batch together environments and simulate them in external processes.

  The environments are created in external processes by calling the provided
  callables. This can be an environment class, or a function creating the
  environment and potentially wrapping it. The returned environment should not
  access global variables.
  """

  def __init__(self, env_constructors, blocking=False, flatten=False):
    """Batch together environments and simulate them in external processes.

    The environments can be different but must use the same action and
    observation specs.

    Args:
      env_constructors: List of callables that create environments.
      blocking: Whether to step environments one after another.
      flatten: Boolean, whether to use flatten action and time_steps during
        communication to reduce overhead.

    Raises:
      ValueError: If the action or observation specs don't match.
    """
    self._envs = [ProcessPyEnvironment(ctor, flatten=flatten)
                  for ctor in env_constructors]
    self._num_envs = len(env_constructors)
    self.start()
    self.action_space = self._envs[0].action_space
    self.observation_space = self._envs[0].observation_space
    self._blocking = blocking
    self._flatten = flatten

  def start(self):
    #tf.logging.info('Starting all processes.')
    for env in self._envs:
      env.start()
    #tf.logging.info('All processes started.')

  @property
  def batched(self):
    return True

  @property
  def batch_size(self):
    return self._num_envs

  def reset(self):
    """Reset all environments and combine the resulting observation.

    Returns:
      Time step with batch dimension.
    """
    time_steps = [env.reset(self._blocking) for env in self._envs]
    if not self._blocking:
      time_steps = [promise() for promise in time_steps]
    return time_steps

  def step(self, actions):
    """Forward a batch of actions to the wrapped environments.

    Args:
      actions: Batched action, possibly nested, to apply to the environment.

    Raises:
      ValueError: Invalid actions.

    Returns:
      Batch of observations, rewards, and done flags.
    """
    time_steps = [
        env.step(action, self._blocking)
        for env, action in zip(self._envs, actions)]
    # When blocking is False we get promises that need to be called.
    if not self._blocking:
      time_steps = [promise() for promise in time_steps]
    return time_steps

  def close(self):
    """Close all external process."""
    for env in self._envs:
      env.close()

  #def _stack_time_steps(self, time_steps):
  #  """Given a list of TimeStep, combine to one with a batch dimension."""
  #  if self._flatten:
  #    return fast_map_structure_flatten(lambda *arrays: np.stack(arrays),
  #                                      self._time_step_spec,
  #                                      *time_steps)
  #  else:
  #    return fast_map_structure(lambda *arrays: np.stack(arrays), *time_steps)

  #def _unstack_actions(self, batched_actions):
  #  """Returns a list of actions from potentially nested batch of actions."""
  #  flattened_actions = nest.flatten(batched_actions)
  #  if self._flatten:
  #    unstacked_actions = zip(*flattened_actions)
  #  else:
  #    unstacked_actions = [nest.pack_sequence_as(batched_actions, actions)
  #                         for actions in zip(*flattened_actions)]
  #  return unstacked_actions


## TODO(sguada) Move to utils.
#def fast_map_structure_flatten(func, structure, *flat_structure):
#  entries = zip(*flat_structure)
#  return nest.pack_sequence_as(structure, [func(*x) for x in entries])


#def fast_map_structure(func, *structure):
#  flat_structure = [nest.flatten(s) for s in structure]
#  entries = zip(*flat_structure)

#  return nest.pack_sequence_as(
#      structure[0], [func(*x) for x in entries])

class ProcessPyEnvironment(object):
  """Step a single env in a separate process for lock free paralellism."""

  # Message types for communication via the pipe.
  _READY = 1
  _ACCESS = 2
  _CALL = 3
  _RESULT = 4
  _EXCEPTION = 5
  _CLOSE = 6

  def __init__(self, env_constructor, flatten=False):
    """Step environment in a separate process for lock free paralellism.

    The environment is created in an external process by calling the provided
    callable. This can be an environment class, or a function creating the
    environment and potentially wrapping it. The returned environment should
    not access global variables.

    Args:
      env_constructor: Callable that creates and returns a Python environment.
      flatten: Boolean, whether to assume flattened actions and time_steps
        during communication to avoid overhead.

    Attributes:
      observation_spec: The cached observation spec of the environment.
      action_spec: The cached action spec of the environment.
      time_step_spec: The cached time step spec of the environment.
    """
    self._env_constructor = env_constructor
    self._flatten = flatten
    #self._observation_spec = None
    #self._action_spec = None
    #self._time_step_spec = None

  def start(self):
    """Start the process."""
    self._conn, conn = multiprocessing.Pipe()
    self._process = multiprocessing.Process(
        target=self._worker,
        args=(conn, self._env_constructor, self._flatten))
    atexit.register(self.close)
    self._process.start()
    result = self._conn.recv()
    if isinstance(result, Exception):
      self._conn.close()
      self._process.join(5)
      raise result
    assert result is self._READY, result

  #def observation_spec(self):
  #  if not self._observation_spec:
  #    self._observation_spec = self.call('observation_spec')()
  #  return self._observation_spec

  #def action_spec(self):
  #  if not self._action_spec:
  #    self._action_spec = self.call('action_spec')()
  #  return self._action_spec

  #def time_step_spec(self):
  #  if not self._time_step_spec:
  #    self._time_step_spec = self.call('time_step_spec')()
  #  return self._time_step_spec

  def __getattr__(self, name):
    """Request an attribute from the environment.

    Note that this involves communication with the external process, so it can
    be slow.

    Args:
      name: Attribute to access.

    Returns:
      Value of the attribute.
    """
    self._conn.send((self._ACCESS, name))
    return self._receive()

  def call(self, name, *args, **kwargs):
    """Asynchronously call a method of the external environment.

    Args:
      name: Name of the method to call.
      *args: Positional arguments to forward to the method.
      **kwargs: Keyword arguments to forward to the method.

    Returns:
      Promise object that blocks and provides the return value when called.
    """
    payload = name, args, kwargs
    self._conn.send((self._CALL, payload))
    return self._receive

  def close(self):
    """Send a close message to the external process and join it."""
    try:
      self._conn.send((self._CLOSE, None))
      self._conn.close()
    except IOError:
      # The connection was already closed.
      pass
    self._process.join(5)

  def step(self, action, blocking=True):
    """Step the environment.

    Args:
      action: The action to apply to the environment.
      blocking: Whether to wait for the result.

    Returns:
      time step when blocking, otherwise callable that returns the time step.
    """
    promise = self.call('step', action)
    if blocking:
      return promise()
    else:
      return promise

  def reset(self, blocking=True):
    """Reset the environment.

    Args:
      blocking: Whether to wait for the result.

    Returns:
      New observation when blocking, otherwise callable that returns the new
      observation.
    """
    promise = self.call('reset')
    if blocking:
      return promise()
    else:
      return promise

  def _receive(self):
    """Wait for a message from the worker process and return its payload.

    Raises:
      Exception: An exception was raised inside the worker process.
      KeyError: The reveived message is of an unknown type.

    Returns:
      Payload object of the message.
    """
    message, payload = self._conn.recv()
    #print(message, payload)
    # Re-raise exceptions in the main process.
    if message == self._EXCEPTION:
      stacktrace = payload
      raise Exception(stacktrace)
    if message == self._RESULT:
      return payload
    self.close()
    raise KeyError('Received message of unexpected type {}'.format(message))

  def _worker(self, conn, env_constructor, flatten=False):
    """The process waits for actions and sends back environment results.

    Args:
      conn: Connection for communication to the main process.
      env_constructor: env_constructor for the OpenAI Gym environment.
      flatten: Boolean, whether to assume flattened actions and time_steps
        during communication to avoid overhead.

    Raises:
      KeyError: When receiving a message of unknown type.
    """
    try:
      env = env_constructor()
      #action_spec = env.action_spec()
      conn.send(self._READY)  # Ready.
      while True:
        #print(len(self._conn._cache))
        try:
          # Only block for short times to have keyboard exceptions be raised.
          if not conn.poll(0.1):
            continue
          message, payload = conn.recv()
        except (EOFError, KeyboardInterrupt):
          break
        if message == self._ACCESS:
          name = payload
          result = getattr(env, name)
          conn.send((self._RESULT, result))
          continue
        if message == self._CALL:
          name, args, kwargs = payload
          if name == 'step' or name == 'reset':
            result = getattr(env, name)(*args, **kwargs)
          #result = []
          #if flatten and name == 'step' or name == 'reset':
          #  args = [nest.pack_sequence_as(action_spec, args[0])]
          #  result = getattr(env, name)(*args, **kwargs)
          #if flatten and name in ['step', 'reset']:
          #  result = nest.flatten(result)
          conn.send((self._RESULT, result))
          continue
        if message == self._CLOSE:
          assert payload is None
          break
        raise KeyError('Received message of unknown type {}'.format(message))
    except Exception:  # pylint: disable=broad-except
      etype, evalue, tb = sys.exc_info()
      stacktrace = ''.join(traceback.format_exception(etype, evalue, tb))
      message = 'Error in environment process: {}'.format(stacktrace)
      #tf.logging.error(message)
      conn.send((self._EXCEPTION, stacktrace))
    finally:
      conn.close()

if __name__ == "__main__":

    config_filename = os.path.join(os.path.dirname(gibson2.__file__), '../test/test.yaml')
    def load_env():
        return NavigateEnv(config_file=config_filename, mode='headless')

    parallel_env = ParallelNavEnvironment([load_env] * 2, blocking=False)
    #from IPython import embed; embed()
    #parallel_env.close()

    from time import time
    for episode in range(10):
        start = time()
        print("episode {}".format(episode))
        parallel_env.reset()
        for i in range(300):
            res =  parallel_env.step([[0, 0.1] for _ in range(2)])
            state, reward, done, _ = res[0]
            if done:
                print("Episode finished after {} timesteps".format(i + 1))
                break
        print("{} elapsed".format(time() - start))
	from gibson2.core.physics.robot_locomotors import *
	from gibson2.core.simulator import Simulator
	from gibson2.core.physics.scene import *
	import gibson2
	from gibson2.utils.utils import parse_config, rotate_vector_3d, l2_distance, quatToXYZW
	from gibson2.envs.base_env import BaseEnv
	from transforms3d.euler import euler2quat
	from collections import OrderedDict
	from gibson2.envs.locomotor_env import *
	import atexit
	import multiprocessing
	import sys
	import traceback
	from tqdm import tqdm
	class ParallelNavEnvironment(NavigateEnv):
	"""Batch together environments and simulate them in external processes.

	The environments are created in external processes by calling the provided
	callables. This can be an environment class, or a function creating the
	environment and potentially wrapping it. The returned environment should not
	access global variables.
	"""

	def __init__(self, env_constructors, blocking=False, flatten=False):
	"""Batch together environments and simulate them in external processes.

	The environments can be different but must use the same action and
	observation specs.

	Args:
	env_constructors: List of callables that create environments.
	blocking: Whether to step environments one after another.
	flatten: Boolean, whether to use flatten action and time_steps during
	communication to reduce overhead.

	Raises:
	ValueError: If the action or observation specs don't match.
	"""
	self._envs = [ProcessPyEnvironment(ctor, flatten=flatten)
	for ctor in env_constructors]
	self._num_envs = len(env_constructors)
	self.start()
	self.action_space = self._envs[0].action_space
	self.observation_space = self._envs[0].observation_space
	self._blocking = blocking
	self._flatten = flatten

	def start(self):
	#tf.logging.info('Starting all processes.')
	for env in self._envs:
	env.start()
	#tf.logging.info('All processes started.')

	@property
	def batched(self):
	return True

	@property
	def batch_size(self):
	return self._num_envs

	def reset(self):
	"""Reset all environments and combine the resulting observation.

	Returns:
	Time step with batch dimension.
	"""
	time_steps = [env.reset(self._blocking) for env in self._envs]
	if not self._blocking:
	time_steps = [promise() for promise in time_steps]
	return time_steps

	def step(self, actions):
	"""Forward a batch of actions to the wrapped environments.

	Args:
	actions: Batched action, possibly nested, to apply to the environment.

	Raises:
	ValueError: Invalid actions.

	Returns:
	Batch of observations, rewards, and done flags.
	"""
	time_steps = [
	env.step(action, self._blocking)
	for env, action in zip(self._envs, actions)]
	# When blocking is False we get promises that need to be called.
	if not self._blocking:
	time_steps = [promise() for promise in time_steps]
	return time_steps

	def close(self):
	"""Close all external process."""
	for env in self._envs:
	env.close()

	#def _stack_time_steps(self, time_steps):
	# """Given a list of TimeStep, combine to one with a batch dimension."""
	# if self._flatten:
	# return fast_map_structure_flatten(lambda *arrays: np.stack(arrays),
	# self._time_step_spec,
	# *time_steps)
	# else:
	# return fast_map_structure(lambda arrays: np.stack(arrays), time_steps)

	#def _unstack_actions(self, batched_actions):
	# """Returns a list of actions from potentially nested batch of actions."""
	# flattened_actions = nest.flatten(batched_actions)
	# if self._flatten:
	# unstacked_actions = zip(*flattened_actions)
	# else:
	# unstacked_actions = [nest.pack_sequence_as(batched_actions, actions)
	# for actions in zip(*flattened_actions)]
	# return unstacked_actions


	## TODO(sguada) Move to utils.
	#def fast_map_structure_flatten(func, structure, *flat_structure):
	# entries = zip(*flat_structure)
	# return nest.pack_sequence_as(structure, [func(*x) for x in entries])


	#def fast_map_structure(func, *structure):
	# flat_structure = [nest.flatten(s) for s in structure]
	# entries = zip(*flat_structure)

	# return nest.pack_sequence_as(
	# structure[0], [func(*x) for x in entries])

	class ProcessPyEnvironment(object):
	"""Step a single env in a separate process for lock free paralellism."""

	# Message types for communication via the pipe.
	_READY = 1
	_ACCESS = 2
	_CALL = 3
	_RESULT = 4
	_EXCEPTION = 5
	_CLOSE = 6

	def __init__(self, env_constructor, flatten=False):
	"""Step environment in a separate process for lock free paralellism.

	The environment is created in an external process by calling the provided
	callable. This can be an environment class, or a function creating the
	environment and potentially wrapping it. The returned environment should
	not access global variables.

	Args:
	env_constructor: Callable that creates and returns a Python environment.
	flatten: Boolean, whether to assume flattened actions and time_steps
	during communication to avoid overhead.

	Attributes:
	observation_spec: The cached observation spec of the environment.
	action_spec: The cached action spec of the environment.
	time_step_spec: The cached time step spec of the environment.
	"""
	self._env_constructor = env_constructor
	self._flatten = flatten
	#self._observation_spec = None
	#self._action_spec = None
	#self._time_step_spec = None

	def start(self):
	"""Start the process."""
	self._conn, conn = multiprocessing.Pipe()
	self._process = multiprocessing.Process(
	target=self._worker,
	args=(conn, self._env_constructor, self._flatten))
	atexit.register(self.close)
	self._process.start()
	result = self._conn.recv()
	if isinstance(result, Exception):
	self._conn.close()
	self._process.join(5)
	raise result
	assert result is self._READY, result

	#def observation_spec(self):
	# if not self._observation_spec:
	# self._observation_spec = self.call('observation_spec')()
	# return self._observation_spec

	#def action_spec(self):
	# if not self._action_spec:
	# self._action_spec = self.call('action_spec')()
	# return self._action_spec

	#def time_step_spec(self):
	# if not self._time_step_spec:
	# self._time_step_spec = self.call('time_step_spec')()
	# return self._time_step_spec

	def __getattr__(self, name):
	"""Request an attribute from the environment.

	Note that this involves communication with the external process, so it can
	be slow.

	Args:
	name: Attribute to access.

	Returns:
	Value of the attribute.
	"""
	self._conn.send((self._ACCESS, name))
	return self._receive()

	def call(self, name, args, *kwargs):
	"""Asynchronously call a method of the external environment.

	Args:
	name: Name of the method to call.
	*args: Positional arguments to forward to the method.
	**kwargs: Keyword arguments to forward to the method.

	Returns:
	Promise object that blocks and provides the return value when called.
	"""
	payload = name, args, kwargs
	self._conn.send((self._CALL, payload))
	return self._receive

	def close(self):
	"""Send a close message to the external process and join it."""
	try:
	self._conn.send((self._CLOSE, None))
	self._conn.close()
	except IOError:
	# The connection was already closed.
	pass
	self._process.join(5)

	def step(self, action, blocking=True):
	"""Step the environment.

	Args:
	action: The action to apply to the environment.
	blocking: Whether to wait for the result.

	Returns:
	time step when blocking, otherwise callable that returns the time step.
	"""
	promise = self.call('step', action)
	if blocking:
	return promise()
	else:
	return promise

	def reset(self, blocking=True):
	"""Reset the environment.

	Args:
	blocking: Whether to wait for the result.

	Returns:
	New observation when blocking, otherwise callable that returns the new
	observation.
	"""
	promise = self.call('reset')
	if blocking:
	return promise()
	else:
	return promise

	def _receive(self):
	"""Wait for a message from the worker process and return its payload.

	Raises:
	Exception: An exception was raised inside the worker process.
	KeyError: The reveived message is of an unknown type.

	Returns:
	Payload object of the message.
	"""
	message, payload = self._conn.recv()
	#print(message, payload)
	# Re-raise exceptions in the main process.
	if message == self._EXCEPTION:
	stacktrace = payload
	raise Exception(stacktrace)
	if message == self._RESULT:
	return payload
	self.close()
	raise KeyError('Received message of unexpected type {}'.format(message))

	def _worker(self, conn, env_constructor, flatten=False):
	"""The process waits for actions and sends back environment results.

	Args:
	conn: Connection for communication to the main process.
	env_constructor: env_constructor for the OpenAI Gym environment.
	flatten: Boolean, whether to assume flattened actions and time_steps
	during communication to avoid overhead.

	Raises:
	KeyError: When receiving a message of unknown type.
	"""
	try:
	env = env_constructor()
	#action_spec = env.action_spec()
	conn.send(self._READY) # Ready.
	while True:
	#print(len(self._conn._cache))
	try:
	# Only block for short times to have keyboard exceptions be raised.
	if not conn.poll(0.1):
	continue
	message, payload = conn.recv()
	except (EOFError, KeyboardInterrupt):
	break
	if message == self._ACCESS:
	name = payload
	result = getattr(env, name)
	conn.send((self._RESULT, result))
	continue
	if message == self._CALL:
	name, args, kwargs = payload
	if name == 'step' or name == 'reset':
	result = getattr(env, name)(args, *kwargs)
	#result = []
	#if flatten and name == 'step' or name == 'reset':
	# args = [nest.pack_sequence_as(action_spec, args[0])]
	# result = getattr(env, name)(args, *kwargs)
	#if flatten and name in ['step', 'reset']:
	# result = nest.flatten(result)
	conn.send((self._RESULT, result))
	continue
	if message == self._CLOSE:
	assert payload is None
	break
	raise KeyError('Received message of unknown type {}'.format(message))
	except Exception: # pylint: disable=broad-except
	etype, evalue, tb = sys.exc_info()
	stacktrace = ''.join(traceback.format_exception(etype, evalue, tb))
	message = 'Error in environment process: {}'.format(stacktrace)
	#tf.logging.error(message)
	conn.send((self._EXCEPTION, stacktrace))
	finally:
	conn.close()

	if __name__ == "__main__":

	config_filename = os.path.join(os.path.dirname(gibson2.__file__), '../test/test.yaml')
	def load_env():
	return NavigateEnv(config_file=config_filename, mode='headless')

	parallel_env = ParallelNavEnvironment([load_env] * 2, blocking=False)
	#from IPython import embed; embed()
	#parallel_env.close()

	from time import time
	for episode in range(10):
	start = time()
	print("episode {}".format(episode))
	parallel_env.reset()
	for i in range(300):
	res = parallel_env.step([[0, 0.1] for _ in range(2)])
	state, reward, done, _ = res[0]
	if done:
	print("Episode finished after {} timesteps".format(i + 1))
	break
	print("{} elapsed".format(time() - start))