# Adding a custom optimizer module: RMSProp example
## Introduction
Rather than implementing a myriad of optimizers, declearn provides a single, simple base `Optimizer` designed for stochastic gradient descent, which can be made to use any arbitrary pipeline of plug-in modules. These modules implement algorithms that change the way model updates are computed from input gradients, e.g. to use acceleration or correction schemes. Modules can be stateful, and their states can be shared between the server and its clients as part of a federated learning process. This tutorial leaves that latter property aside, and focuses on an example that may be run on either the client or the server side and does not require any synchronization as part of federated learning.
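For intuition, applying such a pipeline of plug-in modules amounts to chaining each module's gradient transformation. The following sketch is merely illustrative (it is not declearn's actual `Optimizer` code), and assumes that `Vector` is importable from `declearn.model.api`:

```python
from typing import List

from declearn.model.api import Vector
from declearn.optimizer.modules import EWMAModule, OptiModule, RMSPropModule


def apply_pipeline(gradients: Vector, modules: List[OptiModule]) -> Vector:
    """Illustrative helper: chain the modules' gradient transformations."""
    # Each module takes in a Vector of gradients and outputs a Vector,
    # so modules can simply be applied one after the other.
    for module in modules:
        gradients = module.run(gradients)
    return gradients


# Example pipeline: momentum-like smoothing, then RMSProp adaptive scaling.
pipeline = [EWMAModule(beta=0.9), RMSPropModule()]
```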
## Overview
To create a new optimizer module, write a new class inheriting from the `OptiModule` abstract class. This class is designed to encapsulate any transformation that takes in gradients in the form of a `Vector`, applies a set of transformations, and outputs the transformed gradients as a `Vector` that preserves the input specifications.
Two key conceptual elements need to be included (a minimal skeleton is sketched after this list):

- The parameters of the module, which must be defined and made accessible; in the code, this corresponds to the `__init__` and `get_config` methods.
- The transformations applied to the gradients, which correspond to the `run` method.
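For orientation, here is a minimal skeleton of such a class. The names (`MyModule`, `alpha`, `"my-module"`) are purely illustrative, and the `Vector` import path from `declearn.model.api` is assumed:

```python
from typing import Any, ClassVar, Dict

from declearn.model.api import Vector
from declearn.optimizer.modules import OptiModule


class MyModule(OptiModule):
    """Illustrative skeleton for a custom optimizer module."""

    # Unique identifier used for type-registration.
    name: ClassVar[str] = "my-module"

    def __init__(self, alpha: float = 0.1) -> None:
        # Define and store the module's hyper-parameters.
        self.alpha = alpha

    def get_config(self) -> Dict[str, Any]:
        # Expose the hyper-parameters, enabling (de)serialization.
        return {"alpha": self.alpha}

    def run(self, gradients: Vector) -> Vector:
        # Apply the gradients' transformation (here, a mere rescaling).
        return gradients * self.alpha
```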
If you are contributing to declearn, please write your code in an appropriate file under `declearn.optimizer.modules`, add it to the `__all__` global variable, and import it as part of the `__init__.py` file at its import level. Note that the basic tests for modules will automatically cover your module thanks to its type-registration.
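For illustration, this registration step typically boils down to an excerpt such as the following in the package's `__init__.py` (the exact layout of declearn's file may differ):

```python
# declearn/optimizer/modules/__init__.py (illustrative excerpt)
from ._adaptative import RMSPropModule

__all__ = [
    # ... other exported classes ...
    "RMSPropModule",
]
```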
## RMSProp
We here show how the RMSProp optimizer was added to the codebase. This optimizer introduces diagonal scaling of the gradient updates, allowing apt re-scaling of the step size for each dimension of the gradients.
The Root Mean Square Propagation (RMSProp) algorithm, introduced by [Tieleman and Hinton, 2012](https://www.cs.toronto.edu/~tijmen/csc321/slides/lecture_slides_lec6.pdf), scales down the gradients by the square root of the momentum-corrected sum of the past squared gradients:
- $\text{Init}(\beta, \epsilon)$:
    - $\hat{\nabla} = 0$
- $\text{Step}(\nabla, step)$:
    - $\hat{\nabla} = \beta \cdot \hat{\nabla} + (1 - \beta) \cdot \nabla^2$
    - $\nabla /= (\sqrt{\hat{\nabla}} + \epsilon)$
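To make the update rule concrete, here is a plain-NumPy sketch of a single RMSProp step, independent of declearn's `Vector` abstraction:

```python
import numpy as np

beta, eps = 0.9, 1e-7
grads = np.array([0.5, -2.0])
v_hat = np.zeros_like(grads)  # running average of squared gradients

# One step: update the squared-gradients average, then rescale the gradients.
v_hat = beta * v_hat + (1 - beta) * grads ** 2  # -> [0.025, 0.4]
scaled = grads / (np.sqrt(v_hat) + eps)         # -> [~3.162, ~-3.162]
```

Note that on this very first step both coordinates end up with the same magnitude, illustrating the per-dimension re-scaling of the step size.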
## RMSProp commented code
The RMSProp optimizer is part of the adaptive optimizer family, and was thus added to the `_adaptative.py` file.
```python
from typing import Any, ClassVar, Dict

from declearn.model.api import Vector
from declearn.optimizer.modules import EWMAModule, OptiModule


class RMSPropModule(OptiModule):
    """[Docstring removed for conciseness]"""

    # Identifier, that must be unique across modules for type-registration
    # purposes. This enables specifying the module in configuration files.
    name: ClassVar[str] = "rmsprop"

    # Define the optimizer parameters, here beta and eps.
    def __init__(self, beta: float = 0.9, eps: float = 1e-7) -> None:
        """Instantiate the RMSProp gradients-adaptation module.

        Parameters
        ----------
        beta: float
            Beta parameter for the momentum correction
            applied to the adaptive scaling term.
        eps: float, default=1e-7
            Numerical-stability improvement term, added
            to the (divisor) adaptive scaling term.
        """
        # Reuse the existing EWMA module, see below.
        self.ewma = EWMAModule(beta=beta)
        self.eps = eps

    # Allow access to the module's parameters.
    def get_config(self) -> Dict[str, Any]:
        return {"beta": self.ewma.beta, "eps": self.eps}

    # Define the actual transformation of the gradients.
    def run(self, gradients: Vector) -> Vector:
        v_t = self.ewma.run(gradients ** 2)
        scaling = (v_t ** 0.5) + self.eps
        return gradients / scaling

    # Define the state-access methods; here states are handled by the EWMA.
    def get_state(self) -> Dict[str, Any]:
        return self.ewma.get_state()

    def set_state(self, state: Dict[str, Any]) -> None:
        self.ewma.set_state(state)
```
We here reuse the EWMA module, defined in the `modules/_momentum.py` file. As a module, it takes in a `Vector` and outputs a `Vector`. It has one parameter, $\beta$, manages a `state` vector, and its `run` method looks like this:
```python
def run(self, gradients: Vector) -> Vector:
    self.state = (self.beta * self.state) + ((1 - self.beta) * gradients)
    return self.state
```
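Finally, as a usage sketch (the `Optimizer` constructor arguments shown here are assumed rather than quoted from declearn's documentation), the new module can be plugged into an optimization pipeline:

```python
from declearn.optimizer import Optimizer
from declearn.optimizer.modules import RMSPropModule

# Assumed constructor arguments: a base learning rate and a list of plug-in
# modules, applied in order to transform the input gradients.
optim = Optimizer(lrate=0.001, modules=[RMSPropModule(beta=0.9, eps=1e-7)])

# Thanks to type-registration under the "rmsprop" name, the module can also
# be referred to by that name in serialized optimizer configurations.
```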