# Source code for rl4lms.envs.common.reward


from abc import ABC, abstractclassmethod, abstractmethod
from typing import List

from rl4lms.envs.common.observation import BaseObservation


class RewardFunction(ABC):
    """Abstract interface for reward functions.

    A reward function is a callable object: concrete subclasses override
    ``__call__`` to turn an (observation, action, targets) triple into a
    scalar reward. This base class cannot be instantiated directly.
    """

    # NOTE: this is an instance-level hook (it takes ``self``), so it is
    # declared with ``abstractmethod`` rather than the deprecated
    # ``abstractclassmethod``, which would wrap it as a classmethod.
    @abstractmethod
    def __call__(
        self, observation: "BaseObservation", action: str, targets: List[str]
    ) -> float:
        """Compute the reward for the current step.

        Args:
            observation (BaseObservation): current observation at t
            action (str): current action at t
            targets (List[str]): targets of the current sample

        Returns:
            float: a scalar reward

        Raises:
            NotImplementedError: always in this base implementation;
                subclasses must provide their own ``__call__``.
        """
        raise NotImplementedError