Source code for grid2op.Converter.ToVect

# Copyright (c) 2019-2020, RTE (
# See AUTHORS.txt
# This Source Code Form is subject to the terms of the Mozilla Public License, version 2.0.
# If a copy of the Mozilla Public License, version 2.0 was not distributed with this file,
# you can obtain one at
# SPDX-License-Identifier: MPL-2.0
# This file is part of Grid2Op, Grid2Op a testbed platform to model sequential decision making in power systems.

import numpy as np
from grid2op.Converter.Converters import Converter
from grid2op.dtypes import dt_float, dt_int

[docs]class ToVect(Converter): """ This converters allows to manipulate the vector representation of the actions and observations. In this converter: - `encoded_act` are numpy ndarray - `transformed_obs` are numpy ndarray (read more about these concepts by looking at the documentation of :class:`grid2op.Converter.Converters`) It is convertible to a gym representation (like the original action space) in the form of a spaces.Box representing a continuous action space (even though most component are probably discrete). Note that if converted to a gym space, it is unlikely the method "sample" will yield to valid results. Most of the time it should generate Ambiguous action that will not be handled by grid2op. **NB** the conversion to a gym space should be done thanks to the :class:`grid2op.Converter.GymActionSpace`. """ def __init__(self, action_space): Converter.__init__(self, action_space) self.init_action_space = action_space self.__class__ = ToVect.init_grid(action_space) self.do_nothing_vect = action_space({}).to_vect() # for gym conversion self.__gym_action_space = None self.__dict_space = None self.__order_gym = None self.__dtypes_gym = None self.__shapes_gym = None self.__order_gym_2_me = None self.__order_me_2_gym = None
[docs] def convert_obs(self, obs): """ This converter will match the observation to a vector, using the :func:`grid2op.Observation.BaseObservation.to_vect` function. Parameters ---------- obs: :class:`grid2op.Observation.Observation` The observation, that will be processed into a numpy ndarray vector. Returns ------- transformed_obs: ``numpy.ndarray`` The vector representation of the action. """ return obs.to_vect()
[docs] def convert_act(self, encoded_act): """ In this converter `encoded_act` is a numpy ndarray. This function transforms it back to a valid action. Parameters ---------- encoded_act: ``numpy.ndarray`` The action, represented as a vector Returns ------- regular_act: :class:`grid2op.Action.Action` The corresponding action transformed with the :func:`grid2op.Action.BaseAction.from_vect`. """ res = self.__call__({}) res.from_vect(encoded_act, check_legit=False) return res
def _init_gym_converter(self): if self.__gym_action_space is None: # lazy import from gym import spaces from grid2op.gym_compat import GymActionSpace # i do that not to duplicate the code of the low / high bounds gym_action_space = GymActionSpace(self.init_action_space) low = tuple() high = tuple() order_gym = [] dtypes = [] shapes = [] sizes = [] prev = 0 for k, v in gym_action_space.spaces.items(): order_gym.append(k) dtypes.append(v.dtype) if isinstance(v, spaces.MultiBinary): low += tuple([0 for _ in range(v.n)]) high += tuple([1 for _ in range(v.n)]) my_size = v.n elif isinstance(v, spaces.Box): low += tuple(v.low) high += tuple(v.high) my_size = v.low.shape[0] else: raise RuntimeError( "Impossible to convert this converter to gym. Type {} of data " "encountered while only MultiBinary and Box are supported for now." ) shapes.append(my_size) sizes.append(np.arange(my_size) + prev) prev += my_size self.__gym_action_space = gym_action_space my_type = spaces.Box(low=np.array(low), high=np.array(high), dtype=dt_float) order_me = [] _order_gym_2_me = np.zeros(my_type.shape[0], dtype=dt_int) - 1 _order_me_2_gym = np.zeros(my_type.shape[0], dtype=dt_int) - 1 for el in self.init_action_space.attr_list_vect: order_me.append(GymActionSpace.keys_grid2op_2_human[el]) prev = 0 order_gym = list(gym_action_space.spaces.keys()) for id_me, nm_attr in enumerate(order_me): id_gym = order_gym.index(nm_attr) index_me = np.arange(shapes[id_gym]) + prev _order_gym_2_me[sizes[id_gym]] = index_me _order_me_2_gym[index_me] = sizes[id_gym] # self.__order_gym_2_me[this_gym_ind] = sizes[id_me] prev += shapes[id_gym] self.__order_gym_2_me = _order_gym_2_me self.__order_me_2_gym = _order_me_2_gym self.__dict_space = {"action": my_type} self.__order_gym = order_gym self.__dtypes_gym = dtypes self.__shapes_gym = shapes
[docs] def get_gym_dict(self): """ Convert this action space int a "gym" action space represented by a dictionary (spaces.Dict) This dictionary counts only one keys which is "action" and inside this action is the """ self._init_gym_converter() return self.__dict_space
[docs] def convert_action_from_gym(self, gymlike_action): """ Convert a gym-like action (ie a Ordered dictionary with one key being only "action") to an action compatible with this converter (in this case a vectorized action). """ vect = gymlike_action["action"] return vect[self.__order_gym_2_me]
[docs] def convert_action_to_gym(self, action): """ Convert a an action of this converter (ie a numpy array) into an action that is usable with an open ai gym (ie a Ordered dictionary with one key being only "action") """ from gym import spaces res = spaces.dict.OrderedDict({"action": action[self.__order_me_2_gym]}) return res