import keras as ks
import keras.saving
import keras.optimizers.schedules
# from keras_core import ops


@ks.saving.register_keras_serializable(package='kgcnn', name='LinearWarmupExponentialDecay')
class LinearWarmupExponentialDecay(ks.optimizers.schedules.LearningRateSchedule):
r"""This schedule combines a linear warmup with an exponential decay.
Combines :obj:` tf.optimizers.schedules.PolynomialDecay` with an actual increase during warmup
and :obj:`tf.optimizers.schedules.ExponentialDecay` after.
Introduced by `DimeNetPP <https://arxiv.org/abs/2011.14115>`__ .
The closed-from learning rate schedule for learning rate :math:`\eta` for :math:`s_0` warmup and decay
:math:`S_\tau` is given as a function of steps :math:`s` below (deduced from documentation of keras modules).
.. math::
\eta (s) = \eta_0 \; \gamma ^ {s / S_\tau} \; [1 - \frac{s_0-1}{s_0} \frac{s_0 - \text{min}(s_0, S)}{s_0}]
This class has been updated to be compatible with `GemNet <https://arxiv.org/abs/2106.08903>`__ training.
"""

    def __init__(self, learning_rate, warmup_steps, decay_steps, decay_rate, staircase: bool = False):
        """Initialize class.

        Args:
            learning_rate: Learning rate to use.
            warmup_steps: Number of warmup steps.
            decay_steps: Number of steps over which the learning rate decays by a factor of ``decay_rate``.
            decay_rate: Factor by which to reduce the learning rate.
            staircase (bool): If True, use staircase (discrete) decay instead of continuous exponential decay.
        """
super().__init__()
self._input_config_settings = {"learning_rate": learning_rate, "warmup_steps": warmup_steps,
"decay_steps": decay_steps, "decay_rate": decay_rate, "staircase": staircase}
self.warmup = ks.optimizers.schedules.PolynomialDecay(
1 / warmup_steps, warmup_steps, end_learning_rate=1)
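        # Exponential decay of the target learning rate; multiplied with the
        # warmup factor in __call__.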
self.decay = ks.optimizers.schedules.ExponentialDecay(
learning_rate, decay_steps, decay_rate, staircase=staircase)

    def __call__(self, step):
        """Decay the learning rate as a function of steps.

        Args:
            step: Current step of training.

        Returns:
            float: New learning rate.
        """
return self.warmup(step) * self.decay(step)
@property
def initial_learning_rate(self):
return self.decay.initial_learning_rate
@initial_learning_rate.setter
def initial_learning_rate(self, value):
self.decay.initial_learning_rate = value

    def get_config(self):
"""Get config for this class."""
config = {}
config.update(self._input_config_settings)
return config
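

# Usage sketch (illustrative, not part of the original module): a schedule instance
# can be passed directly as the ``learning_rate`` of a Keras optimizer. The
# hyper-parameter values below are assumptions, not tuned recommendations:
#
#     lr_schedule = LinearWarmupExponentialDecay(
#         learning_rate=1e-3, warmup_steps=3000, decay_steps=100000,
#         decay_rate=0.1, staircase=False)
#     optimizer = ks.optimizers.Adam(learning_rate=lr_schedule)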


@ks.saving.register_keras_serializable(package='kgcnn', name='KerasPolynomialDecaySchedule')
class KerasPolynomialDecaySchedule(ks.optimizers.schedules.PolynomialDecay):
r"""This schedule inherits from :obj:` ks.optimizers.schedules.PolynomialDecay` ."""

    def __init__(self, dataset_size: int, batch_size: int, epochs: int, lr_start: float = 0.0005,
                 lr_stop: float = 1e-5):
        """Initialize class.

        Args:
            dataset_size (int): Size of the dataset.
            batch_size (int): Batch size for training.
            epochs (int): Total number of epochs to run the schedule for.
            lr_start (float): Learning rate at the start.
            lr_stop (float): Final learning rate.
        """
self._input_config_settings = {"lr_start": lr_start, "lr_stop": lr_stop,
"epochs": epochs, "batch_size": batch_size, "dataset_size": dataset_size}
steps_per_epoch = dataset_size / batch_size
num_steps = epochs * steps_per_epoch
super().__init__(initial_learning_rate=lr_start, decay_steps=num_steps, end_learning_rate=lr_stop)

    def get_config(self):
"""Get config for this class."""
config = {}
config.update(self._input_config_settings)
return config
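

# Usage sketch (illustrative, not part of the original module); the dataset numbers
# below are assumptions:
#
#     lr_schedule = KerasPolynomialDecaySchedule(
#         dataset_size=60000, batch_size=32, epochs=100,
#         lr_start=0.0005, lr_stop=1e-5)
#     optimizer = ks.optimizers.Adam(learning_rate=lr_schedule)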