Source code for drytorch.trackers.base_classes

"""Module containing abstract classes for trackers."""

import abc
import functools
import pathlib

from collections.abc import Generator, Iterable
from pathlib import Path
from typing import ClassVar, Final, Generic, TypeAlias, TypeVar

import numpy as np
import numpy.typing as npt

from typing_extensions import override

from drytorch.core import exceptions, log_events, tracking


HistoryMetric: TypeAlias = tuple[list[int], list[float]]
HistoryMetrics: TypeAlias = tuple[list[int], dict[str, list[float]]]
SourcedMetric: TypeAlias = dict[str, HistoryMetric]
SourcedMetrics: TypeAlias = dict[str, HistoryMetrics]
NpArray: TypeAlias = npt.NDArray[np.float64]
SourcedArray: TypeAlias = dict[str, NpArray]

Plot = TypeVar('Plot')



[docs]
class Dumper(tracking.Tracker):
    """Tracker with a standard folder structure.

    Attributes:
        folder_name: name of the folder containing the output.
        user_par_dir: parent directory for the tracker data.
        _par_dir: parent directory set by experiment.
        _exp_name: experiment name set by experiment.
        _run_id: run identifier set by experiment.
    """

    folder_name: ClassVar[str] = 'tracker'

    user_par_dir: Path | None
    _par_dir: pathlib.Path | None
    _exp_name: str | None
    _run_id: str | None

    def __init__(self, par_dir: pathlib.Path | None = None) -> None:
        """Initialize.

        Args:
            par_dir: the parent directory for the tracker data. Default uses
                the same of the current experiment.
        """
        super().__init__()
        self.user_par_dir = par_dir
        self._par_dir = None
        self._exp_name = None
        self._run_id = None
        return

    @property
    def par_dir(self) -> pathlib.Path:
        """Return the parent directory for the experiments.

        Raises:
            AccessOutsideScopeError: when the default folder is not available.
        """
        if self.user_par_dir is None:
            if self._par_dir is None:
                raise exceptions.AccessOutsideScopeError()
            path = self._par_dir
        else:
            path = self.user_par_dir

        return path

    @property
    def run_id(self) -> str:
        """Return the identifier for the experiment run.

        Raises:
            AccessOutsideScopeError: when the id of the run is not available.
        """
        if self._run_id is None:
            raise exceptions.AccessOutsideScopeError()

        return self._run_id

    @property
    def exp_name(self) -> str:
        """Return the name of the experiment.

        Raises:
            AccessOutsideScopeError: when the name id not available.
        """
        if self._exp_name is None:
            raise exceptions.AccessOutsideScopeError()

        return self._exp_name


[docs]
    def clean_up(self) -> None:
        """Remove experimental data from the tracker."""
        self._par_dir = None
        self._exp_name = None
        self._run_id = None



[docs]
    @functools.singledispatchmethod
    @override
    def notify(self, event: log_events.Event) -> None:
        return super().notify(event)


    @notify.register
    def _(self, event: log_events.StartExperimentEvent) -> None:
        self._par_dir = event.par_dir
        self._exp_name = event.exp_name
        self._run_id = event.run_id
        self.par_dir.mkdir(exist_ok=True, parents=True)
        return super().notify(event)

    @notify.register
    def _(self, event: log_events.StopExperimentEvent) -> None:
        return super().notify(event)

    def _get_exp_dir(self) -> pathlib.Path:
        exp_dir = self.par_dir / self.folder_name / self.exp_name
        exp_dir.mkdir(exist_ok=True, parents=True)
        return exp_dir

    def _get_run_dir(self, mkdir: bool = True) -> pathlib.Path:
        exp_dir = self._get_exp_dir()
        if '@' in self.run_id:
            day, time = self.run_id.split('@')
            run_dir = exp_dir / day / time
        else:
            run_dir = exp_dir / self.run_id
        if mkdir:
            run_dir.mkdir(exist_ok=True, parents=True)
        return run_dir




[docs]
class MetricLoader(tracking.Tracker, abc.ABC):
    """Interface for trackers that load metrics."""


[docs]
    def load_metrics(
        self, model_name: str, max_epoch: int = -1
    ) -> SourcedMetrics:
        """Load metrics from the last run of the experiment.

        Args:
            model_name: the name of the model.
            max_epoch: the maximum epoch to load. Defaults to all.

        Returns:
            The current epochs and named metric values by the source.

        Raises:
            ValueError: if max_epoch is less than -1.
        """
        if max_epoch == 0:
            return {}

        if max_epoch < -1:
            raise ValueError('Max epoch should not be less than -1.')

        return self._load_metrics(model_name, max_epoch)


    @abc.abstractmethod
    def _load_metrics(
        self, model_name: str, max_epoch: int = -1
    ) -> SourcedMetrics: ...




[docs]
class MemoryMetrics(tracking.Tracker):
    """Keep all metrics in memory.

    Attributes:
        model_dict: all metrics recorded in this session.
    """

    _metric_loader: MetricLoader | None
    model_dict: dict[str, SourcedMetrics]

    def __init__(self, metric_loader: MetricLoader | None = None) -> None:
        """Initialize.

        Args:
            metric_loader: object to load the metrics.
        """
        super().__init__()
        self._metric_loader: Final = metric_loader
        self.model_dict: Final = dict[str, SourcedMetrics]()
        return


[docs]
    @functools.singledispatchmethod
    @override
    def notify(self, event: log_events.Event) -> None:
        return super().notify(event)


    @notify.register
    def _(self, event: log_events.MetricEvent) -> None:
        sourced_metrics = self.model_dict.setdefault(event.model_name, {})
        epochs, logs_dict = sourced_metrics.setdefault(
            event.source_name, ([], {})
        )
        epochs.append(event.epoch)
        for metric_name, metric_value in event.metrics.items():
            logs_dict.setdefault(metric_name, []).append(metric_value)

        return super().notify(event)

    @notify.register
    def _(self, event: log_events.LoadModelEvent) -> None:
        if self._metric_loader is None:
            return None

        metrics = self._metric_loader.load_metrics(
            event.model_name, event.epoch
        )
        self.model_dict[event.model_name] = metrics
        return super().notify(event)




[docs]
class BasePlotter(MemoryMetrics, abc.ABC, Generic[Plot]):
    """Abstract class for plotting trajectory from sources.

    Attributes:
        _model_names: names of the models to plot.
        _source_names: names of the sources to plot.
        _metric_names: names of the metrics to plot.
        _start: epoch from which to start plotting.
        _removed_start: flag indicating if start epochs were removed.
    """

    _model_names: Iterable[str]
    _source_names: Iterable[str]
    _metric_names: Iterable[str]
    _start: int
    _removed_start: bool

    def __init__(
        self,
        model_names: Iterable[str] = (),
        source_names: Iterable[str] = (),
        metric_names: Iterable[str] = (),
        start: int = 1,
        metric_loader: MetricLoader | None = None,
    ) -> None:
        """Initialize.

        Args:
            model_names: the names of the models to plot. Defaults to all.
            source_names: the names of the sources to plot. Defaults to all.
            metric_names: the names of the metrics to plot. Defaults to all.
            start: if positive, the epoch from which to start plotting;
                if negative, the last number of epochs. Defaults to all.
            metric_loader: a tracker that can load metrics from a previous run.

        Note:
            start_epoch allows you to exclude the initial epochs from the graph.
            During the first 2 * start_epoch epochs, the graph is shown in
            its entirety.
        """
        super().__init__(metric_loader)
        self._model_names: Final = model_names
        self._source_names: Final = source_names
        self._metric_names: Final = metric_names
        self._start = start
        self._removed_start = False


[docs]
    @functools.singledispatchmethod
    @override
    def notify(self, event: log_events.Event) -> None:
        return super().notify(event)


    @notify.register
    def _(self, event: log_events.EndEpochEvent) -> None:
        if self._start < 0:
            start: int = max(1, event.epoch + self._start)
        else:
            start = self._start if event.epoch >= 2 * self._start else 1

        self._update_plot(model_name=event.model_name, start=start)
        return super().notify(event)

    @notify.register
    def _(self, event: log_events.EndTestEvent) -> None:
        start = max(1, self._start)
        self._update_plot(model_name=event.model_name, start=start)
        return super().notify(event)


[docs]
    def plot(
        self,
        model_name: str,
        source_names: Iterable[str] = (),
        metric_names: Iterable[str] = (),
        start_epoch: int = 1,
    ) -> list[Plot]:
        """Plot the learning curves.

        Args:
            model_name: the name of the model to plot.
            source_names: the names of the sources to plot. Defaults to all.
            metric_names: the metric to plot. Defaults to all.
            start_epoch: the epoch from which to start plotting.

        Returns:
            References to the plot objects or windows depending on the backend.

        Raises:
            ValueError: if start_epoch is less than 1.
            ValueError: if the model is not found.
        """
        if start_epoch < 1:
            raise ValueError('Start epoch must be positive.')

        sourced_metrics = self.model_dict.get(model_name, {})
        if not sourced_metrics and self._metric_loader is not None:
            sourced_metrics = self._metric_loader.load_metrics(model_name)

        if sourced_metrics:
            self.model_dict[model_name] = sourced_metrics
        else:
            msg = f'No model named {model_name} has been found.'
            raise ValueError(msg)

        return self._plot(model_name, source_names, metric_names, start_epoch)


    def _plot(
        self,
        model_name: str,
        source_names: Iterable[str],
        metric_names: Iterable[str],
        start: int,
    ) -> list[Plot]:
        sourced_metrics = self.model_dict.get(model_name, {})
        if source_names:
            sourced_metrics = {
                source: sourced_metrics[source]
                for source in source_names
                if source in sourced_metrics
            }
        if not metric_names:
            all_metrics: Generator[set[str], None, None] = (
                set(logs[1]) for logs in sourced_metrics.values()
            )
            metric_names = sorted(set().union(*all_metrics))

        plots = list[Plot]()
        self._prepare_layout(model_name, list(metric_names))
        for metric_name in metric_names:
            processed_sources = self._process_source(
                sourced_metrics, metric_name, start
            )
            if processed_sources:
                plots.append(
                    self._plot_metric(
                        model_name, metric_name, **processed_sources
                    )
                )

        return plots

    @abc.abstractmethod
    def _plot_metric(
        self, model_name: str, metric_name: str, **sourced_array: NpArray
    ) -> Plot: ...

    def _prepare_layout(self, model_name: str, metric_names: list[str]) -> None:
        _not_used = model_name, metric_names
        return

    def _process_source(
        self, sourced_metrics: SourcedMetrics, metric_name: str, start: int
    ) -> SourcedArray:
        sourced_metric = self._filter_metric(sourced_metrics, metric_name)
        ordered_sources = self._order_sources(sourced_metric)
        sourced_array = self._source_to_numpy(ordered_sources)
        return self._filter_by_epoch(sourced_array, start)

    def _update_plot(self, model_name: str, start: int) -> None:
        if self._model_names and model_name not in self._model_names:
            return

        self._plot(model_name, self._source_names, self._metric_names, start)
        return

    @classmethod
    def _order_sources(cls, sources: SourcedMetric) -> SourcedMetric:
        return dict(sorted(sources.items(), key=cls._len_source))

    @staticmethod
    def _filter_metric(
        sourced_metrics: SourcedMetrics, metric_name: str
    ) -> SourcedMetric:
        return {
            source_name: (epochs, metrics[metric_name])
            for source_name, (epochs, metrics) in sourced_metrics.items()
            if epochs and metric_name in metrics
        }

    @staticmethod
    def _filter_by_epoch(
        sourced_array: SourcedArray, start: int
    ) -> SourcedArray:
        if start == 1:
            return sourced_array

        filtered = {}
        for name, data in sourced_array.items():
            mask = data[:, 0] >= start  # the epoch is in column 0
            if np.any(mask):
                filtered[name] = data[mask]

        return filtered

    @staticmethod
    def _len_source(source_pair: tuple[str, HistoryMetric]) -> int:
        return -len(source_pair[1][0])  # does not reverse when equal

    @staticmethod
    def _source_to_numpy(sourced_metric: SourcedMetric) -> SourcedArray:
        return {
            name: np.column_stack((epochs, values))
            for name, (epochs, values) in sourced_metric.items()
        }