Source code for smartgrid.observation.global_observation

"""
Global observations of the World, shared by all Agents in the smart grid.
"""

import dataclasses
from typing import ClassVar, Optional

import numpy as np

from smartgrid.observation.base_observation import BaseObservation
from smartgrid.util import hoover



[docs]
@dataclasses.dataclass(frozen=True)
class GlobalObservation(BaseObservation):
    """
    Global observations of the World, shared by all Agents in the smart grid.

    Observations cannot be modified once created, to limit potential bugs.
    Global observations are not directly linked to a particular agent, but
    rather to the whole society of agents in the :py:class:`.World`, i.e.,
    in this smart grid. Thus, the measures are the same for all agents.

    To optimize computations, we thus create global observations only once
    each step. This is done through the :py:attr:`.last_step_compute` and
    :py:attr:`.computed` *class* attributes. We emphasize that they should
    **not** be accessed through an instance, as they are not relevant as
    observations, merely to *compute observations*.

    A global observation contains the following measures:

    hour
        The current hour in the simulated world. It is computed as a ratio
        between 0 and 1, and days are ignored by using a modulo.
        Specifically, assuming that the current time step is ``t``, the *hour*
        measure is computed as ``(t % 24) / 24``.

    available_energy
        The quantity of energy available in the grid, which is accessible to
        all agents. This is a large pool of energy, however they should avoid
        over-consuming it, and take an appropriate quantity so as to let
        other agents profit as well.
        This measure is normalized as a value between 0 and 1, from the *real*
        available quantity, w.r.t. the bounds of energy that could have been
        generated at this step. See the :py:mod:`.energy_generator` module
        for more details on energy generators, and their bounds.

    equity
        The equity of comforts between all agents in the grid, i.e., to which
        degree do they have a similar comfort. It is computed as a statistical
        indicator of dispersion named the
        `Hoover index <https://en.wikipedia.org/wiki/Hoover_index>`_, which
        is a well-known tool in economy, originally made to describe income
        inequality.
        ``equity`` is computed as ``1 - hoover(comforts)``, such that 0
        represents a perfect inequality (one person has everything, the others
        nothing), and 1 a perfect equality (everybody has the same comfort).

    energy_loss
        The quantity of energy that was available to agents, but not used
        (i.e., neither consumed nor stored) at this time step.

    autonomy
        This measure represents the autonomy, or self-sustainability, of the
        smart grid. It is measured based on the transactions (i.e., selling or
        buying energy from and to the national grid), w.r.t. the total amount
        of energy exchanged within the grid (given, stored, consumed).

    exclusion
        The proportion of agents that have a comfort lower than half the median
        of agents' comforts. Such agents are said to be *excluded*.

    well_being
        The median of all agents' comfort. Using a median rather than an average
        reduces the impact of outliers.

    over_consumption
        The quantity of energy that agents have consumed, but was not
        originally available in the grid. We assume that the grid automatically
        bought this missing energy from the national grid.
        It is computed as the sum of energy consumed from the grid and stored
        from the grid, by all agents, minus the sum of energy given by all
        agents, and the energy initially available, divided by the sum of
        energy taken by all agents, to obtain a ratio between 0 and 1.
        If the measure is less than 0, we set it to 0.
    """

    # Instance attributes = observations measures

    hour: float
    """The current hour, represented in ``[0,1]``."""

    available_energy: float
    """The ratio of available energy in the Grid, compared to the maximum possible."""

    equity: float
    """The equity, a statistical measure of dispersion, between agents' comforts."""

    energy_loss: float
    """The ratio of energy not consumed over the total energy exchanges."""

    autonomy: float
    """
    The ratio of exchanges that are not with the national grid, over the total exchanges.
    """

    exclusion: float
    """The proportion of agents with a comfort less than half the median."""

    well_being: float
    """The median of agents' comforts."""

    over_consumption: float
    """The ratio of energy consumed that was not available, over the total exchanges."""

    # Class attributes = used to memorize observations

    last_step_compute: ClassVar[int] = -1
    """
    Last time step at which global observations were computed.
    
    This is used to optimize the computations and avoid re-computing already
    known observations, since these are the same for all agents at a given
    time step.
    """

    computed: ClassVar[Optional['Self']] = None
    """
    Memoized global observations, computed at the time step indicated by
    :py:attr:`.last_step_compute`.
    """


[docs]
    @classmethod
    def _is_compute(cls, world: 'World') -> bool:
        """
        Private method to know whether the current step has already been computed.
        """
        return world.current_step == cls.last_step_compute



[docs]
    @classmethod
    def compute(cls, world: 'World') -> 'Self':
        """
        Return the global observations computed from the World state.

        This method uses memoization through :py:attr:`.computed`,
        :py:meth:`._is_compute` and :py:attr:`.last_step_compute` to avoid
        re-computing already known observations. In such cases, the cached
        instance is returned. Otherwise, measures are computed, and a new
        instance is created, memoized, and returned.

        :type world: smartgrid.world.World
        :param world: The World for which we want to compute the global
            observations.

        :rtype: GlobalObservation
        """
        # return directly if the step have been computed
        if cls._is_compute(world):
            return cls.computed

        # Pre-compute some intermediate data
        comforts = []
        sum_taken, sum_given, sum_transactions, sum_consumed, sum_stored = 0, 0, 0, 0, 0
        for a in world.agents:
            comforts.append(a.state.comfort)
            sum_taken += a.enacted_action.grid_consumption + a.enacted_action.store_energy
            sum_given += a.enacted_action.give_energy
            sum_transactions += a.enacted_action.buy_energy + a.enacted_action.sell_energy
            sum_consumed += a.enacted_action.grid_consumption + a.enacted_action.storage_consumption
            sum_stored += a.enacted_action.store_energy

        # Compute some common measures about env
        hour = (world.current_step % 24) / 24
        available_energy = np.interp(
            world.available_energy,
            world.energy_generator.available_energy_bounds(
                world.current_need,
                world.current_step,
                world.min_needed_energy,
                world.max_needed_energy
            ),
            (0, 1)
        )
        equity = 1.0 - hoover(comforts)

        over_consumption = max(0.0, sum_taken - sum_given - world.available_energy)
        over_consumption /= (sum_taken + 10E-300)

        energy_loss = max(0.0, -over_consumption)

        autonomy = 1.0 - sum_transactions / (sum_consumed + sum_stored
                                             + sum_given + sum_transactions + 10E-300)

        well_being = np.median(comforts)
        if np.isnan(well_being):
            well_being = 0.0

        threshold = well_being / 2
        exclusion = len([c for c in comforts if c < threshold]) / len(comforts)

        cls.last_step_compute = world.current_step
        cls.computed = cls(
            hour=hour,
            available_energy=available_energy,
            equity=equity,
            energy_loss=energy_loss,
            autonomy=autonomy,
            exclusion=exclusion,
            well_being=well_being,
            over_consumption=over_consumption,
        )
        return cls.computed



[docs]
    @classmethod
    def reset(cls):
        """
        Reset the counter of steps computed, i.e., the memoization.
        """
        cls.last_step_compute = -1
        # We also reset the memoized value, just to make it clear that it
        # is no longer the correct value. Since the counter is set to `-1`,
        # it should not be used anyway...
        cls.computed = None