Source code for explauto.environment.environment

import time
from numpy import zeros, array, hstack
from abc import ABCMeta, abstractmethod

from ..utils.config import make_configuration
from ..utils.observer import Observable
from ..utils import rand_bounds
from .testcase import Lattice

from . import environments

[docs]class Environment(Observable):
    """ Abstract class to define environments.

        When defining your sub-environment, you should specify whether they could be forked and run in different processes through the use_process class variable. By default, it is set to False to guarantee that the code will work.

    """
    __metaclass__ = ABCMeta
    use_process = False

    def __init__(self, m_mins, m_maxs, s_mins, s_maxs):
        """
        :param numpy.array m_mins, m_maxs, s_mins, s_maxs: bounds of the motor (m) and sensory (s) spaces

        """
        Observable.__init__(self)

        self.conf = make_configuration(m_mins, m_maxs, s_mins, s_maxs)

    @classmethod
[docs]    def from_configuration(cls, env_name, config_name='default'):
        """ Environment factory from name and configuration strings.

        :param str env_name: the name string of the environment

        :param str config_name: the configuration string for env_name

        Environment name strings are available using::

            from explauto.environment import environments
            print environments.keys()

        This will return the available environment names, something like::

            '['npendulum', 'pendulum', 'simple_arm']'

        Once you have choose an environment, e.g. 'simple_arm', corresponding available configurations are available using::

            env_cls, env_configs, _ = environments['simple_arm']
            print env_configs.keys()

        This will return the available configuration names for the 'simple_arm' environment, something like::

            '['mid_dimensional', 'default', 'high_dim_high_s_range', 'low_dimensional', 'high_dimensional']'

        Once you have choose a configuration, for example the 'mid_dimensional' one, you can contruct the environment using::

            from explauto import Environment
            my_environment = Environment.from_configuration('simple_arm', 'mid_dimensional')

        Or, in an equivalent manner::

            my_environment = env_cls(**env_configs['mid_dimensional'])
        """
        env_cls, env_configs, _ = environments[env_name]
        return env_cls(**env_configs[config_name])

[docs]    def one_update(self, m_ag, log=True):
        m_env = self.compute_motor_command(m_ag)
        s = self.compute_sensori_effect(m_env)

        if log:
            self.emit('motor', m_env)
            self.emit('sensori', s)

        return s

[docs]    def update(self, m_ag, log=True):
        """ Computes sensorimotor values from motor orders.

        :param numpy.array m_ag: a motor command with shape (self.conf.m_ndims, ) or a set of n motor commands of shape (n, self.conf.m_ndims)

        :param bool log: emit the motor and sensory values for logging purpose (default: True).

        :returns: an array of shape (self.conf.ndims, ) or (n, self.conf.ndims) according to the shape of the m_ag parameter, containing the motor values (which can be different from m_ag, e.g. bounded according to self.conf.m_bounds) and the corresponding sensory values.

        .. note:: self.conf.ndims = self.conf.m_ndims + self.conf.s_ndims is the dimensionality of the sensorimotor space (dim of the motor space + dim of the sensory space).
        """

        self.reset()
        if len(array(m_ag).shape) == 1:
            s = self.one_update(m_ag, log)
        else:
            s = []
            for m in m_ag:
                s.append(self.one_update(m, log))
            s = array(s)
        return s

[docs]    def reset(self):
        """ reset environment before update """
        pass

    @abstractmethod
[docs]    def compute_motor_command(self, ag_state):
        raise NotImplementedError

    @abstractmethod
[docs]    def compute_sensori_effect(self):
        raise NotImplementedError

[docs]    def random_motors(self, n=1):
        return rand_bounds(self.conf.bounds[:, self.conf.m_dims], n)

[docs]    def dataset(self, orders):
        return array([hstack((m, self.update(m))) for m in orders])

[docs]    def uniform_sensor(self, n_cases=100):
        n_random_motor = n_cases * 100
        m_feats = tuple(range(-self.conf.m_ndims, 0))
        s_feats = tuple(range(self.conf.s_ndims))
        m_bounds = tuple([(self.conf.m_mins[d], self.conf.m_maxs[d])
                          for d in self.conf.m_dims])

        ms_uniform_motor = self.dataset(self.random_motors(n_random_motor))
        resolution = max(2, int((1.3*n_cases)**(1.0/len(s_feats))))
        observations = []
        for ms in ms_uniform_motor:
            observations.append((ms[self.conf.m_dims], ms[self.conf.s_dims]))
        lattice = Lattice(s_feats, observations, res=resolution)
        result = []
        for ms in list(lattice.grid.values()):
            result.append(ms[1])
        return array(result)