* Fixing mean tracked loss
* Adding a PINA progress bar
committed by Nicola Demo
parent 0fa4e1e58a
commit cce9876751
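In `MetricTracker`, metric collection moves from `on_train_epoch_start` (which recorded each epoch's metrics one epoch late) to `on_train_epoch_end`, and the now-redundant `on_train_end` hook is removed, so the tracked mean loss lines up with the epoch it was computed in. The new `PINAProgressBar` callback restricts the progress bar to a chosen subset of condition losses. A minimal usage sketch, assuming a `solver` already built for a problem with a condition named `gamma1`; the condition name, the `Trainer` import path, and the `train()` call follow common PINA usage but are illustrative, not part of this commit:

    from pina.trainer import Trainer            # assumed import path
    from pina.callbacks import MetricTracker, PINAProgressBar

    tracker = MetricTracker()                   # collects logged metrics each epoch
    pbar = PINAProgressBar(metrics=["mean", "gamma1"])  # show only these losses

    # `solver` is assumed to be an already-built PINA solver (e.g. a PINN)
    trainer = Trainer(solver, callbacks=[tracker, pbar], max_epochs=100)
    trainer.train()
    print(tracker.metrics)                      # metrics collected at each epoch end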
@@ -1,5 +1,10 @@
-__all__ = ["SwitchOptimizer", "R3Refinement", "MetricTracker"]
+__all__ = [
+    "SwitchOptimizer",
+    "R3Refinement",
+    "MetricTracker",
+    "PINAProgressBar"
+]
 
 from .optimizer_callbacks import SwitchOptimizer
 from .adaptive_refinment_callbacks import R3Refinement
-from .processing_callbacks import MetricTracker
+from .processing_callbacks import MetricTracker, PINAProgressBar
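With `PINAProgressBar` added to `__all__` and re-exported, both callbacks are importable from the package in one line (a sketch, assuming the public package path `pina.callbacks`):

    from pina.callbacks import SwitchOptimizer, R3Refinement, MetricTracker, PINAProgressBar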
@@ -1,11 +1,14 @@
 """PINA Callbacks Implementations"""
 
-from pytorch_lightning.callbacks import Callback
 from pytorch_lightning.core.module import LightningModule
 from pytorch_lightning.trainer.trainer import Trainer
 import torch
 import copy
 
+from pytorch_lightning.callbacks import Callback, TQDMProgressBar
+from lightning.pytorch.callbacks.progress.progress_bar import get_standard_metrics
+from pytorch_lightning.utilities import rank_zero_warn
+from pina.utils import check_consistency
 
 
 class MetricTracker(Callback):
@@ -13,9 +15,11 @@ class MetricTracker(Callback):
     """
     PINA Implementation of a Lightning Callback for Metric Tracking.
 
-    This class provides functionality to track relevant metrics during the training process.
+    This class provides functionality to track relevant metrics during
+    the training process.
 
-    :ivar _collection: A list to store collected metrics after each training epoch.
+    :ivar _collection: A list to store collected metrics after each
+        training epoch.
 
     :param trainer: The trainer object managing the training process.
     :type trainer: pytorch_lightning.Trainer
@@ -28,20 +32,16 @@ class MetricTracker(Callback):
         >>> # ... Perform training ...
         >>> metrics = tracker.metrics
         """
         super().__init__()
         self._collection = []
 
-    def on_train_epoch_start(self, trainer, pl_module):
+    def on_train_epoch_end(self, trainer, pl_module):
         """
-        Collect and track metrics at the start of each training epoch. At epoch
-        zero the metric is not saved. At epoch ``k`` the metric which is tracked
-        is the one of epoch ``k-1``.
+        Collect and track metrics at the end of each training epoch.
 
         :param trainer: The trainer object managing the training process.
         :type trainer: pytorch_lightning.Trainer
         :param pl_module: Placeholder argument.
 
         :return: None
         :rtype: None
         """
+        super().on_train_epoch_end(trainer, pl_module)
         if trainer.current_epoch > 0:
@@ -49,23 +49,6 @@ class MetricTracker(Callback):
             self._collection.append(
                 copy.deepcopy(trainer.logged_metrics)
             ) # track them
 
-    def on_train_end(self, trainer, pl_module):
-        """
-        Collect and track metrics at the end of training.
-
-        :param trainer: The trainer object managing the training process.
-        :type trainer: pytorch_lightning.Trainer
-        :param pl_module: Placeholder argument.
-
-        :return: None
-        :rtype: None
-        """
-        super().on_train_end(trainer, pl_module)
-        if trainer.current_epoch > 0:
-            self._collection.append(
-                copy.deepcopy(trainer.logged_metrics)
-            ) # track them
-
     @property
     def metrics(self):
         """
@@ -80,3 +63,91 @@ class MetricTracker(Callback):
             for k in common_keys
         }
         return v
+
+
+class PINAProgressBar(TQDMProgressBar):
+
+    BAR_FORMAT = "{l_bar}{bar}| {n_fmt}/{total_fmt} [{elapsed}<{remaining}, {rate_noinv_fmt}{postfix}]"
+
+    def __init__(self, metrics='mean', **kwargs):
+        """
+        PINA Implementation of a Lightning Callback for enriching the progress
+        bar.
+
+        This class provides functionality to display only relevant metrics
+        during the training process.
+
+        :param metrics: Logged metrics to display during the training. It should
+            be a subset of the condition keys defined in
+            :obj:`pina.condition.Condition`.
+        :type metrics: str | list(str) | tuple(str)
+
+        :Keyword Arguments:
+            The additional keyword arguments specify the progress bar
+            and can be chosen from the `pytorch-lightning
+            TQDMProgressBar API <https://lightning.ai/docs/pytorch/stable/_modules/lightning/pytorch/callbacks/progress/tqdm_progress.html#TQDMProgressBar>`_
+
+        Example:
+            >>> pbar = PINAProgressBar(['mean'])
+            >>> # ... Perform training ...
+            >>> trainer = Trainer(solver, callbacks=[pbar])
+        """
+        super().__init__(**kwargs)
+        # check consistency
+        if not isinstance(metrics, (list, tuple)):
+            metrics = [metrics]
+        check_consistency(metrics, str)
+        self._sorted_metrics = metrics
+
+    def get_metrics(self, trainer, pl_module):
+        r"""Combines progress bar metrics collected from the trainer with
+        standard metrics from ``get_standard_metrics``.
+        Implement this to override the items displayed in the progress bar.
+        The progress bar metrics are sorted according to ``metrics``.
+
+        Here is an example of how to override the defaults:
+
+        .. code-block:: python
+
+            def get_metrics(self, trainer, model):
+                # don't show the version number
+                items = super().get_metrics(trainer, model)
+                items.pop("v_num", None)
+                return items
+
+        :return: Dictionary with the items to be displayed in the progress bar.
+        :rtype: dict
+        """
+        standard_metrics = get_standard_metrics(trainer)
+        pbar_metrics = trainer.progress_bar_metrics
+        if pbar_metrics:
+            pbar_metrics = {
+                key: pbar_metrics[key] for key in self._sorted_metrics
+            }
+        duplicates = list(standard_metrics.keys() & pbar_metrics.keys())
+        if duplicates:
+            rank_zero_warn(
+                f"The progress bar already tracks a metric with the name(s) '{', '.join(duplicates)}' and"
+                f" `self.log('{duplicates[0]}', ..., prog_bar=True)` will overwrite this value. "
+                " If this is undesired, change the name or override `get_metrics()` in the progress bar callback.",
+            )
+
+        return {**standard_metrics, **pbar_metrics}
+
+    def on_fit_start(self, trainer, pl_module):
+        """
+        Check that the metrics defined in the initialization are available,
+        i.e. are correctly logged.
+
+        :param trainer: The trainer object managing the training process.
+        :type trainer: pytorch_lightning.Trainer
+        :param pl_module: Placeholder argument.
+        """
+        # Check if all keys in sort_keys are present in the dictionary
+        for key in self._sorted_metrics:
+            if key not in trainer.solver.problem.conditions.keys() and key != 'mean':
+                raise KeyError(f"Key '{key}' is not present in the dictionary")
+        # add the loss suffix
+        self._sorted_metrics = [
+            metric + '_loss' for metric in self._sorted_metrics]
+        return super().on_fit_start(trainer, pl_module)
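The filtering in `get_metrics`, combined with the `_loss` suffix appended in `on_fit_start`, means the bar displays only the selected condition losses. A standalone sketch of that logic, with hypothetical metric names standing in for `trainer.progress_bar_metrics`:

    # Hypothetical logged metrics, as they would appear after the solver logs them.
    logged = {"mean_loss": 0.031, "gamma1_loss": 0.012, "gamma2_loss": 0.055}

    selected = ["mean"]                           # as passed to PINAProgressBar
    selected = [m + "_loss" for m in selected]    # suffix added in on_fit_start

    shown = {k: logged[k] for k in selected}      # filtering done in get_metrics
    print(shown)                                  # {'mean_loss': 0.031}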