# Source code for paddlets.models.common.callbacks.callbacks

#!/usr/bin/env python3
# -*- coding: UTF-8 -*-
################################################################################
#
# Copyright (c) 2022 Baidu.com, Inc. All Rights Reserved
#
################################################################################

from typing import List, Dict, Any, Optional
import datetime
import time
import copy

import numpy as np

from paddlets.logger import Logger

# Module-level logger created with this module's name; the callbacks below
# use it to emit their progress and summary messages.
logger = Logger(__name__)


class Callback(object):
    """Abstract base class used to build new callbacks.

    Every hook defined here is a no-op; subclasses override only the hooks
    they are interested in.

    Attributes:
        _trainer(PaddleBaseModel|None): The model instance bound through
            `set_trainer`, or None while no model has been bound yet.
    """
    def __init__(self):
        # Create the attribute up front so that reading `_trainer` before
        # `set_trainer` was called yields None instead of AttributeError.
        self._trainer = None

    def set_trainer(
        self,
        model: "PaddleBaseModel"
    ):
        """Set model instance.

        Args:
            model(PaddleBaseModel): A model instance.
        """
        self._trainer = model

    def on_epoch_begin(
        self,
        epoch: int,
        logs: Optional[Dict[str, Any]] = None
    ):
        """Called at the beginning of each epoch.

        Args:
            epoch(int): The index of epoch.
            logs(Dict[str, Any]|None): The logs is a dict or None.
        """
        pass

    def on_epoch_end(
        self,
        epoch: int,
        logs: Optional[Dict[str, Any]] = None
    ):
        """Called at the end of each epoch.

        Args:
            epoch(int): The index of epoch.
            logs(Dict[str, Any]|None): The logs is a dict or None.
                When given, it contains `loss` and `metrics`.
        """
        pass

    def on_batch_begin(
        self,
        batch: int,
        logs: Optional[Dict[str, Any]] = None
    ):
        """Called at the beginning of each batch in training.

        Args:
            batch(int): The index of batch.
            logs(Dict[str, Any]|None): The logs is a dict or None.
        """
        pass

    def on_batch_end(
        self,
        batch: int,
        logs: Optional[Dict[str, Any]] = None
    ):
        """Called at the end of each batch in training.

        Args:
            batch(int): The index of batch.
            logs(Dict[str, Any]|None): The logs is a dict or None.
                When given, it contains `loss` and `batch_size`.
        """
        pass

    def on_train_begin(
        self,
        logs: Optional[Dict[str, Any]] = None
    ):
        """Called at the start of training.

        Args:
            logs(Dict[str, Any]|None): The logs is a dict or None.
        """
        pass

    def on_train_end(
        self,
        logs: Optional[Dict[str, Any]] = None
    ):
        """Called at the end of training.

        Args:
            logs(Dict[str, Any]|None): The logs is a dict or None.
        """
        pass


class CallbackContainer(object):
    """Container holding a list of callbacks.

    Each hook of the container forwards the call, in list order, to the hook
    of the same name on every contained callback.

    Args:
        callbacks(List[Callback]): List of callbacks. The list object itself
            is kept (not copied), so `append` also extends the caller's list.
            None is treated as an empty list.

    Attributes:
        _callbacks(List[Callback]): List of callbacks.
        _trainer(PaddleBaseModel|None): The model instance bound through
            `set_trainer`, or None while no model has been bound yet.
    """
    def __init__(
        self,
        callbacks: List["Callback"]
    ):
        self._callbacks = [] if callbacks is None else callbacks
        self._trainer = None

    def append(
        self,
        callback: "Callback"
    ):
        """Append callback to the container.

        Args:
            callback(Callback): Callback instance.
        """
        self._callbacks.append(callback)

    def set_trainer(
        self,
        model: "PaddleBaseModel"
    ):
        """Set model instance on the container and on every callback.

        Args:
            model(PaddleBaseModel): A model instance.
        """
        self._trainer = model
        for callback in self._callbacks:
            callback.set_trainer(model)

    def on_epoch_begin(
        self,
        epoch: int,
        logs: Optional[Dict[str, Any]] = None
    ):
        """Called at the beginning of each epoch.

        Args:
            epoch(int): The index of epoch.
            logs(Dict[str, Any]|None): The logs is a dict or None.
        """
        # Only substitute a fresh dict for None: an empty dict supplied by the
        # caller must stay the same object so callbacks' writes remain visible.
        logs = {} if logs is None else logs
        for callback in self._callbacks:
            callback.on_epoch_begin(epoch, logs)

    def on_epoch_end(
        self,
        epoch: int,
        logs: Optional[Dict[str, Any]] = None
    ):
        """Called at the end of each epoch.

        Args:
            epoch(int): The index of epoch.
            logs(Dict[str, Any]|None): The logs is a dict or None.
                When given, it contains `loss` and `metrics`.
        """
        logs = {} if logs is None else logs
        for callback in self._callbacks:
            callback.on_epoch_end(epoch, logs)

    def on_batch_begin(
        self,
        batch: int,
        logs: Optional[Dict[str, Any]] = None
    ):
        """Called at the beginning of each batch in training.

        Args:
            batch(int): The index of batch.
            logs(Dict[str, Any]|None): The logs is a dict or None.
        """
        logs = {} if logs is None else logs
        for callback in self._callbacks:
            callback.on_batch_begin(batch, logs)

    def on_batch_end(
        self,
        batch: int,
        logs: Optional[Dict[str, Any]] = None
    ):
        """Called at the end of each batch in training.

        Args:
            batch(int): The index of batch.
            logs(Dict[str, Any]|None): The logs is a dict or None.
                When given, it contains `loss` and `batch_size`.
        """
        logs = {} if logs is None else logs
        for callback in self._callbacks:
            callback.on_batch_end(batch, logs)

    def on_train_begin(
        self,
        logs: Optional[Dict[str, Any]] = None
    ):
        """Called at the start of training.

        Args:
            logs(Dict[str, Any]|None): The logs is a dict or None.
        """
        logs = {} if logs is None else logs
        for callback in self._callbacks:
            callback.on_train_begin(logs)

    def on_train_end(
        self,
        logs: Optional[Dict[str, Any]] = None
    ):
        """Called at the end of training.

        Args:
            logs(Dict[str, Any]|None): The logs is a dict or None.
        """
        logs = {} if logs is None else logs
        for callback in self._callbacks:
            callback.on_train_end(logs)


class EarlyStopping(Callback):
    """EarlyStopping callback, allows the trainer to exit the training loop
    if the given metric stopped improving during evaluation.

    Args:
        early_stopping_metric(str): Early stopping metric name.
        is_maximize(bool): Whether to maximize or not early_stopping_metric.
        tol(float): Minimum change in monitored value to qualify as improvement.
            This number should be positive.
        patience(int): Number of epochs to wait for improvement before terminating.
            The counter is reset after each improvement.

    Attributes:
        _early_stopping_metric(str): Early stopping metric name.
        _is_maximize(bool): Whether to maximize or not early_stopping_metric.
        _tol(float): Minimum change in monitored value to qualify as improvement.
        _patience(int): Number of epochs to wait for improvement before terminating.
        _best_epoch(int): Best epoch.
        _stopped_epoch(int): Stopped epoch.
        _early_stopped(bool): Whether this callback requested the stop.
        _best_weights(Any|None): Deep copy of the network state dict taken at
            the best epoch; None until the first improvement is observed.
        _best_loss(float): Best loss.
        _wait(int): Number of times that the early_stopping_metric failed to improve.
    """
    def __init__(
        self,
        early_stopping_metric: str,
        is_maximize: bool,
        tol: float = 0.,
        patience: int = 1
    ):
        super(EarlyStopping, self).__init__()
        self._early_stopping_metric = early_stopping_metric
        self._is_maximize = is_maximize
        self._tol = tol
        self._patience = patience
        self._best_epoch = 0
        self._stopped_epoch = 0
        # Separate flag: `_stopped_epoch` alone cannot tell "stopped at
        # epoch 0" apart from "never stopped".
        self._early_stopped = False
        self._best_weights = None
        # Start from the worst possible value for the chosen direction so that
        # the first finite observation counts as an improvement.
        self._best_loss = -np.inf if self._is_maximize else np.inf
        self._wait = 0

    def on_epoch_end(
        self,
        epoch: int,
        logs: Optional[Dict[str, Any]] = None
    ):
        """Called at the end of each epoch.

        Compares the monitored metric with the best value seen so far. On an
        improvement larger than `tol` the network weights are snapshotted and
        the wait counter is reset; otherwise the counter is incremented and,
        once it reaches `patience`, the trainer is asked to stop.

        Args:
            epoch(int): The index of epoch.
            logs(Dict[str, Any]|None): The logs is a dict or None.
                When given, it contains `loss` and `metrics`.
        """
        current_loss = (logs or {}).get(self._early_stopping_metric)
        if current_loss is None:
            # The monitored metric was not reported for this epoch; skip
            # without touching the counters.
            return

        loss_change = current_loss - self._best_loss
        if self._is_maximize:
            improved = loss_change > self._tol
        else:
            improved = -loss_change > self._tol

        if improved:
            # Deep copy so later training steps cannot alter the snapshot.
            self._best_weights = copy.deepcopy(self._trainer._network.state_dict())
            self._best_loss = current_loss
            self._best_epoch = epoch
            self._wait = 0
            return

        self._wait += 1
        if self._wait >= self._patience:
            self._trainer._stop_training = True
            self._stopped_epoch = epoch
            self._early_stopped = True

    def on_train_end(
        self,
        logs: Optional[Dict[str, Any]] = None
    ):
        """Called at the end of training.

        Publishes the best epoch and best metric value on the trainer, restores
        the snapshotted best weights (if any) and logs why training ended.

        Args:
            logs(Dict[str, Any]|None): The logs is a dict or None.
        """
        self._trainer._best_epoch = self._best_epoch
        self._trainer._best_cost = self._best_loss

        weights_restored = self._best_weights is not None
        if weights_restored:
            self._trainer._network.set_state_dict(self._best_weights)

        summary = (
            f" with best_epoch = {self._best_epoch} and "
            f"best_{self._early_stopping_metric} = {self._best_loss:.6f}"
        )
        if self._early_stopped:
            msg = f"\nEarly stopping occurred at epoch {self._stopped_epoch}" + summary
        else:
            msg = (
                f"Stop training because you reached max_epochs = {self._trainer._max_epochs}"
                + summary
            )
        logger.info(msg)

        # Only announce the restore when a snapshot was actually loaded.
        if weights_restored:
            logger.info("Best weights from best epoch are automatically used!")


class History(Callback):
    """Callback that records events into a `History` object.

    Args:
        verbose(int): Print results every verbose iteration; 0 disables printing.

    Attributes:
        _verbose(int): Print results every verbose iteration.
        _history(Dict[str, Any]): Record all information of metrics of each epoch.
            Created in `on_train_begin`.
        _start_time(float): Start time of training. Set in `on_train_begin`.
        _epoch_loss(float): Average loss per epoch (sample-weighted running mean).
        _epoch_metrics(Dict[str, Any]): Metrics of the current epoch; reset in
            `on_epoch_begin` and appended to `_history` in `on_epoch_end`.
        _samples_seen(float): Traversed samples in the current epoch.
    """
    def __init__(
        self,
        verbose: int = 1
    ):
        super(History, self).__init__()
        self._verbose = verbose

    def on_train_begin(
        self,
        logs: Optional[Dict[str, Any]] = None
    ):
        """Called at the start of training.

        Args:
            logs(Dict[str, Any]|None): The logs is a dict or None. When it
                carries `start_time`, that value is used as the training start;
                otherwise the current time is used.
        """
        self._history = {"loss": [], "lr": []}
        start_time = (logs or {}).get("start_time")
        # Fall back to "now" so elapsed-time reporting still works when the
        # caller did not provide a start time.
        self._start_time = time.time() if start_time is None else start_time
        self._epoch_loss = 0.

    def on_epoch_begin(
        self,
        epoch: int,
        logs: Optional[Dict[str, Any]] = None
    ):
        """Called at the beginning of each epoch.

        Args:
            epoch(int): The index of epoch.
            logs(Dict[str, Any]|None): The logs is a dict or None.
        """
        self._epoch_metrics = {"loss": 0.}
        self._samples_seen = 0.
        # Reset explicitly: relying on `0 * previous_loss` in `on_batch_end`
        # would carry a previous inf/nan loss into every later epoch.
        self._epoch_loss = 0.

    def on_epoch_end(
        self,
        epoch: int,
        logs: Optional[Dict[str, Any]] = None
    ):
        """Called at the end of each epoch.

        Appends the current epoch metrics to the history and, depending on
        `verbose`, logs a one-line summary with the elapsed time.

        Args:
            epoch(int): The index of epoch.
            logs(Dict[str, Any]|None): The logs is a dict or None.
                When given, it contains `loss` and `metrics`.
        """
        self._epoch_metrics["loss"] = self._epoch_loss
        for metric_name, metric_value in self._epoch_metrics.items():
            self._history.setdefault(metric_name, []).append(metric_value)

        if self._verbose == 0 or epoch % self._verbose != 0:
            return

        parts = [f"epoch {epoch:0>3}"]
        parts.extend(
            f"| {metric_name:<3}: {metric_value:.6f}"
            for metric_name, metric_value in self._epoch_metrics.items()
            if metric_name != "lr"  # the learning rate is recorded but not printed
        )
        total_time = int(time.time() - self._start_time)
        parts.append(f"| {str(datetime.timedelta(seconds=total_time)) + 's':<6}")
        logger.info("".join(parts))

    def on_batch_end(
        self,
        batch: int,
        logs: Optional[Dict[str, Any]] = None
    ):
        """Called at the end of each batch in training.

        Folds the batch loss into the sample-weighted running mean of the
        current epoch.

        Args:
            batch(int): The index of batch.
            logs(Dict[str, Any]|None): Must be a dict that contains `loss`
                and `batch_size`.
        """
        batch_size = logs["batch_size"]
        total_samples = self._samples_seen + batch_size
        if total_samples == 0:
            # Empty batch before any sample was seen: nothing to average and
            # the update below would divide by zero.
            return
        self._epoch_loss = (
            self._samples_seen * self._epoch_loss + batch_size * logs["loss"]
        ) / total_samples
        self._samples_seen = total_samples