# Source code for mushroom_rl.utils.callbacks.collect_max_q

from mushroom_rl.utils.callbacks.callback import Callback
import numpy as np


class CollectMaxQ(Callback):
    """
    This callback can be used to collect the maximum action value in a given
    state at each call.

    """
    def __init__(self, approximator, state):
        """
        Constructor.

        Args:
            approximator ([Table, EnsembleTable]): the approximator to use;
            state (np.ndarray): the state to consider.

        """
        # Attributes are stored before delegating to the parent constructor,
        # keeping the original initialization order.
        self._approximator = approximator
        self._state = state

        super().__init__()

    def __call__(self, dataset):
        """
        Query the approximator in the stored state and record the largest
        predicted value.

        Args:
            dataset: not used by this callback; accepted only so that the
                call signature is preserved.

        """
        q = self._approximator.predict(self._state)

        # NOTE(review): ``_data_list`` is not created in this class; it is
        # presumably set up by ``Callback.__init__`` -- confirm.
        self._data_list.append(np.max(q))