# Source code for graphenv.graph_model_bellman_mixin

from graphenv import tf


class GraphModelBellmanMixin:
    """
    Mixin for use with GraphModel that evaluates the current state as the
    max of the successor state value assessments.

    The mixin reads ``self.action_values`` but does not define it; presumably
    the GraphModel class it is combined with provides that attribute
    (TODO confirm against GraphModel).
    """

    def _forward_total_value(self):
        """
        Overrides state evaluation, replacing it with a Bellman backup returning
        the max over all successor states' values.

        Returns:
            Tensor of state values, computed by max-reducing
            ``self.action_values`` along axis 1.
        """
        # NOTE(review): axis 1 is presumably the per-state action/successor
        # axis (i.e. action_values shaped (batch, num_actions)) -- confirm.
        return tf.reduce_max(self.action_values, axis=1)