Source code for grid2op.Agent.oneChangeThenNothing

# Copyright (c) 2019-2020, RTE (https://www.rte-france.com)
# See AUTHORS.txt
# This Source Code Form is subject to the terms of the Mozilla Public License, version 2.0.
# If a copy of the Mozilla Public License, version 2.0 was not distributed with this file,
# you can obtain one at http://mozilla.org/MPL/2.0/.
# SPDX-License-Identifier: MPL-2.0
# This file is part of Grid2Op, Grid2Op a testbed platform to model sequential decision making in power systems.

import warnings
from grid2op.Agent.baseAgent import BaseAgent


[docs]class OneChangeThenNothing(BaseAgent):
    """
    .. warning::
        As of grid2op 1.10.2, this class has been deprecated. Please use `env.reset(options={"init state": THE_INITIAl_CHANGE})`
        instead.
    
    This is a specific kind of BaseAgent. It does an BaseAction (possibly non empty) at the first time step and then does
    nothing.

    This class is an abstract class and cannot be instanciated (ie no object of this class can be created). It must
    be overridden and the method :func:`OneChangeThenNothing._get_dict_act` be defined. Basically, it must know
    what action to do.

    Attributes
    ------------
    my_dict: ``dict`` (class member)
        Representation, as a dictionnary of the only action that this Agent will do at the first time step.

    Examples
    ---------
    
    This class is deprecated in favor of the "init state" reset options. Please avoid using it.
    
    But if you really want to use it... then you can do it with:

    .. code-block:: python

        # This class has been deprecated, please use the env.reset()
        # with proper options instead
        
        # DEPRECATED ! 
        import grid2op
        from grid2op.Agent import OneChangeThenNothing
        acts_dict_ = [{}, {"set_line_status": [(0,-1)]}]  # list of dictionaries. Each dictionary
        # represents a valid action

        env = grid2op.make("l2rpn_case14_sandbox")  # create an environment
        for act_as_dict in zip(acts_dict_):
            # generate the proper class that will perform the first action (encoded by {}) in acts_dict_
            agent_class = OneChangeThenNothing.gen_next(act_as_dict)
            
            # start a runner with this agent
            runner = Runner(**env.get_params_for_runner(), agentClass=agent_class)
            # run 2 episode with it
            res_2 = runner.run(nb_episode=2)


    Notes
    ------
    
    After grid2op 1.10.2, this class has been deprecated. A cleaner alternative
    to use it is to set the initial state of grid when calling `env.reset` like this:
    
    .. code-block:: python
    
        import grid2op
        
        env = grid2op.make("l2rpn_case14_sandbox")  # create an environment
        dict_act_json = ...  # dict representing an action
        obs = env.reset(options={"init state": dict_act_json})
    
    This way of doing offers:
    
    - more flexibility: rules are not checked
    - more flexibility: any type of actions acting on anything can be performed
      (even if the action would be illegal for the agent)
    - less trouble: cooldown are not affected
    
    """

    my_dict = {}

    def __init__(self, action_space):
        BaseAgent.__init__(self, action_space)
        cls = type(self)
        warnings.warn(f"Deprecated class, please use `env.reset(options={{'init state': {self.action_space(cls.my_dict).to_json()}, 'method': 'ignore' }})` instead")
        self.has_changed = False
        self.do_nothing_action = self.action_space({})

[docs]    def act(self, observation, reward, done=False):
        if self.has_changed:
            res = self.do_nothing_action
        else:
            res = self.action_space(self._get_dict_act())
            self.has_changed = True
        return res

[docs]    def reset(self, obs):
        self.has_changed = False

[docs]    def _get_dict_act(self):
        """
        Function that need to be overridden to indicate which action to perform.

        Returns
        -------
        res: ``dict``
            A dictionnary that can be converted into a valid :class:`grid2op.BaseAction.BaseAction`. See the help of
            :func:`grid2op.BaseAction.ActionSpace.__call__` for more information.
        """
        return self.my_dict

[docs]    @classmethod
    def gen_next(cls, dict_):
        """
        This function allows to change the dictionnary of the action that the agent will perform.

        See the class level documentation for an example on how to use this.

        Parameters
        ----------
        dict_: ``dict``
            A dictionnary representing an action. This dictionnary is assumed to be convertible into an action.
            No check is performed at this stage.


        """
        cls.my_dict = dict_
        return cls