Add ClearMLLogger (#568)
* Add clearml logger implementation

* Stable version

* Add iterations and series logic

* Add tmp results

* WIP: basic functionality

* WIP: logging for parallel backtest

* formatting

* added tests

* updated examples

* fixed spelling

* updated warnings to ignore

* updated lock file

* fixed spelling

* updated holiday tests

* added deprecation warnings to ignore list

* fixed tests

* review fixes

* updated docs

* added tests

* updated changelog

* updated docs

---------

Co-authored-by: Aleksandr Chikov <[email protected]>
Co-authored-by: Чиков Александр Павлович <[email protected]>
3 people authored Jan 24, 2025
1 parent ca1dc4e commit 5630cab
Showing 23 changed files with 4,463 additions and 3,172 deletions.
2 changes: 1 addition & 1 deletion CHANGELOG.md
@@ -7,7 +7,7 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0

## Unreleased
### Added
--
+- Add `ClearMLLogger` ([#568](https://github.com/etna-team/etna/pull/568))
-
-
-
2 changes: 1 addition & 1 deletion CONTRIBUTING.md
@@ -116,7 +116,7 @@ Useful links:
1. [ReST Quickref](https://docutils.sourceforge.io/docs/user/rst/quickref.html)
2. [ReST Roles](https://www.sphinx-doc.org/en/master/usage/restructuredtext/roles.html)
3. [ReST Cross-referencing Python objects](https://www.sphinx-doc.org/en/master/usage/restructuredtext/domains.html#cross-referencing-python-objects)
-4. [Matplotlib Cheetsheet](https://matplotlib.org/sampledoc/cheatsheet.html)
+4. [Matplotlib Cheatsheet](https://matplotlib.org/sampledoc/cheatsheet.html)
5. [Sklearn example](https://github.com/scikit-learn/scikit-learn/blob/37ac6788c/sklearn/linear_model/_ridge.py#L321)

The simplest way to check how documentation is rendered is to make a pull request.
1 change: 1 addition & 0 deletions docs/source/api_reference/loggers.rst
@@ -22,6 +22,7 @@ Loggers:
   LocalFileLogger
   S3FileLogger
   WandbLogger
+   ClearMLLogger

There is a global object :code:`tslogger` that can be imported. It has a class:

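As context for the docs change above, a minimal usage sketch of attaching the new logger to the global ``tslogger`` (the project and task names here are made up for illustration; it assumes the ``clearml`` extra is installed and ClearML credentials are configured):

from etna.loggers import ClearMLLogger
from etna.loggers import tslogger

clearml_logger = ClearMLLogger(project_name="etna-demo", task_name="docs-example")  # hypothetical names
tslogger.add(clearml_logger)  # subsequent pipeline runs are logged to ClearML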
3 changes: 3 additions & 0 deletions docs/source/api_reference/settings.rst
@@ -19,9 +19,12 @@ All available installation options:
pip install "etna[prophet]"
pip install "etna[torch]"
pip install "etna[wandb]"
pip install "etna[clearml]"
pip install "etna[auto]"
pip install "etna[classification]"
pip install "etna[statsforecast]"
pip install "etna[chronos]"
pip install "etna[timesfm]"
pip install "etna[all]"
.. note::
1 change: 1 addition & 0 deletions docs/source/installation.rst
@@ -26,6 +26,7 @@ Available user extensions are the following:
- ``classification``: adds time series classification functionality,
- ``chronos``: adds Chronos-like pretrained models,
- ``timesfm``: adds TimesFM pretrained models,
+- ``clearml``: adds ClearML logger with TensorBoard support.

Install extension:

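Completing the truncated hunk above, the new extra is installed like any of the others (this mirrors the option list already shown in settings.rst):

pip install "etna[clearml]"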
2 changes: 1 addition & 1 deletion etna/datasets/tsdataset.py
@@ -786,7 +786,7 @@ def to_flatten(df: pd.DataFrame, features: Union[Literal["all"], Sequence[str]]
    features:
        List of features to return.
        If "all", return all the features in the dataset.
-        Always return columns with timestamp and segemnt.
+        Always return columns with timestamp and segment.

    Returns
    -------
    pd.DataFrame:
5 changes: 3 additions & 2 deletions etna/loggers/__init__.py
@@ -17,11 +17,12 @@
"""
from etna import SETTINGS
from etna.loggers.base import _Logger
+from etna.loggers.base import tslogger
from etna.loggers.console_logger import ConsoleLogger
from etna.loggers.file_logger import LocalFileLogger
from etna.loggers.file_logger import S3FileLogger

if SETTINGS.wandb_required:
    from etna.loggers.wandb_logger import WandbLogger

-tslogger = _Logger()
+if SETTINGS.clearml_required:
+    from etna.loggers.clearml_logger import ClearMLLogger
11 changes: 11 additions & 0 deletions etna/loggers/base.py
@@ -186,3 +186,14 @@ def disable(self):
        self.loggers = []
        yield
        self.loggers = temp_loggers

    @contextmanager
    def capture_tslogger(self):
        """Context manager to capture global logger."""
        parent_loggers = tslogger.loggers
        tslogger.loggers = self.loggers
        yield
        tslogger.loggers = parent_loggers


tslogger = _Logger()
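A short sketch of how the new ``capture_tslogger`` context manager behaves (the surrounding setup is illustrative, not from the diff): it temporarily swaps the global ``tslogger``'s handler list for this logger's own, which is what lets events from parallel backtest workers be routed back to a parent logger:

from etna.loggers import ConsoleLogger
from etna.loggers import tslogger
from etna.loggers.base import _Logger

local_logger = _Logger()
local_logger.add(ConsoleLogger())

with local_logger.capture_tslogger():
    # anything sent through the global tslogger inside this block
    # is handled by local_logger's ConsoleLogger instead
    tslogger.log("captured by local_logger")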
301 changes: 301 additions & 0 deletions etna/loggers/clearml_logger.py
@@ -0,0 +1,301 @@
import base64
import logging
from typing import TYPE_CHECKING
from typing import Any
from typing import Dict
from typing import Mapping
from typing import Optional
from typing import Sequence
from typing import Union
from uuid import uuid4

import pandas as pd

from etna.loggers.base import BaseLogger

if TYPE_CHECKING:
    from clearml.task import Task

    from etna.datasets import TSDataset


class ClearMLLogger(BaseLogger):
    """ClearML logger.

    Note
    ----
    This logger requires ``clearml`` extension to be installed.
    Read more about this at :ref:`installation page <installation>`.

    Warning
    -------
    There is a possibility that aggregated metrics charts may be logged incorrectly.
    For more details see `issue <https://github.com/etna-team/etna/issues/579>`_.
    """

    def __init__(
        self,
        project_name: Optional[str] = None,
        task_name: Optional[str] = None,
        task_name_prefix: str = "",
        task_type: str = "training",
        tags: Optional[Sequence[str]] = None,
        output_uri: Optional[Union[str, bool]] = None,
        auto_connect_frameworks: Union[bool, Mapping[str, Union[bool, str, list]]] = False,
        auto_resource_monitoring: Union[bool, Mapping[str, Any]] = True,
        auto_connect_streams: Union[bool, Mapping[str, bool]] = True,
        plot: bool = True,
        table: bool = True,
        config: Optional[Dict[str, Any]] = None,
        save_dir: Optional[str] = None,
    ):
        """Create instance of ``ClearMLLogger``.

        Parameters
        ----------
        project_name:
            The name of the project in which the experiment will be created.
        task_name:
            The name of Task (experiment).
        task_name_prefix:
            Prefix for the Task name field.
        task_type:
            The task type.
        tags:
            Add a list of tags (str) to the created Task.
        output_uri:
            The default location for output models and other artifacts.
        auto_connect_frameworks:
            Automatically connect frameworks.
        auto_resource_monitoring:
            Automatically create machine resource monitoring plots.
        auto_connect_streams:
            Control the automatic logging of stdout and stderr.
        plot:
            Indicator for making and sending plots.
        table:
            Indicator for making and sending tables.
        config:
            A dictionary-like object for saving inputs to your job,
            like hyperparameters for a model or settings for a data preprocessing job.
        save_dir:
            Path to the directory for saving intermediate data. Used only when logging DL models.
            Defaults to ``./tb_save``.

        Notes
        -----
        For more details see `documentation <https://clear.ml/docs/latest/docs/references/sdk/task/#taskinit>`_
        """
        super().__init__()
        self.project_name = project_name
        self.task_name = (
            task_name_prefix + base64.urlsafe_b64encode(uuid4().bytes).decode("utf8").rstrip("=\n")[:8]
            if task_name is None
            else task_name
        )
        self.task_name_prefix = task_name_prefix
        self.task_type = task_type
        self.tags = tags
        self.output_uri = output_uri
        self.auto_connect_frameworks = auto_connect_frameworks
        self.auto_resource_monitoring = auto_resource_monitoring
        self.auto_connect_streams = auto_connect_streams
        self.plot = plot
        self.table = table
        self.config = config
        self.save_dir = "./tb_save" if save_dir is None else save_dir

        self._pl_logger = None
        self._job_type: Optional[str] = None
        self._fold_id: Optional[Union[str, int]] = None

        self._task: Optional["Task"] = None
        self.init_task()

    def log(self, msg: Union[str, Dict[str, Any]], **kwargs):
        """Log any event.

        This logger writes the string representation of a message.

        Parameters
        ----------
        msg:
            Message or dict to log
        kwargs:
            Additional parameters for particular implementation
        """
        level = kwargs.get("level", logging.INFO)
        print_console = kwargs.get("print_console", True)
        self._get_logger().report_text(
            msg=str(msg) if not isinstance(msg, str) else msg, level=level, print_console=print_console
        )

    def log_backtest_metrics(
        self, ts: "TSDataset", metrics_df: pd.DataFrame, forecast_df: pd.DataFrame, fold_info_df: pd.DataFrame
    ):
        """Write metrics to logger.

        Parameters
        ----------
        ts:
            TSDataset with backtest data
        metrics_df:
            Dataframe produced with :py:meth:`etna.pipeline.Pipeline._get_backtest_metrics`
        forecast_df:
            Forecast from backtest
        fold_info_df:
            Fold information from backtest
        """
        from etna.analysis import plot_backtest_interactive
        from etna.metrics.utils import aggregate_metrics_df

        if self._job_type is None:
            raise ValueError(
                "Experiment is not properly initialized! Ensure that ``start_experiment`` is called before logging backtest results."
            )

        logger = self._get_logger()

        if self.table:
            logger.report_table(title="Fold info", series=self._job_type, table_plot=fold_info_df)

        if self.plot:
            fig = plot_backtest_interactive(forecast_df, ts, history_len=100)
            logger.report_plotly(title="Backtest forecast", series=self._job_type, figure=fig)

        metrics_dict = aggregate_metrics_df(metrics_df)
        for metric, value in metrics_dict.items():
            logger.report_single_value(name=metric, value=value)

    def log_backtest_run(self, metrics: pd.DataFrame, forecast: pd.DataFrame, test: pd.DataFrame):
        """Write backtest metrics from one fold to logger.

        Parameters
        ----------
        metrics:
            Dataframe with metrics from backtest fold
        forecast:
            Dataframe with forecast
        test:
            Dataframe with ground truth
        """
        from etna.datasets import TSDataset
        from etna.metrics.utils import aggregate_metrics_df

        if self._job_type is None or self._fold_id is None:
            raise ValueError(
                "Experiment is not properly initialized! Ensure that ``start_experiment`` is called before logging backtest run."
            )

        columns_name = list(metrics.columns)
        metrics = metrics.reset_index()
        metrics.columns = ["segment"] + columns_name

        logger = self._get_logger()
        if self.table:
            logger.report_table(
                title="Metrics per fold", series=f"{self._job_type} Fold - {self._fold_id}", table_plot=metrics
            )
            logger.report_table(
                title="Forecasts per fold",
                series=f"{self._job_type} Fold - {self._fold_id}",
                table_plot=TSDataset.to_flatten(forecast),
            )
            logger.report_table(
                title="Test folds",
                series=f"{self._job_type} Fold - {self._fold_id}",
                table_plot=TSDataset.to_flatten(test),
            )

        if isinstance(self._fold_id, int):
            metrics_dict = aggregate_metrics_df(metrics)
            for metric, value in metrics_dict.items():
                logger.report_scalar(title=metric, series=self._job_type, iteration=self._fold_id, value=value)
        else:
            self.log(
                msg="Logging of scalars requires integer fold ids! Aggregated metrics logging will be skipped!",
                level=logging.WARNING,
            )

    def start_experiment(self, job_type: Optional[str] = None, group: Optional[str] = None, *args, **kwargs):
        """Start ``Task``.

        Complete logger initialization or reinitialize it before the next experiment with the same name.

        Parameters
        ----------
        job_type:
            Specify the type of task, which is useful when you're grouping runs together
            into larger experiments using group.
        group:
            Specify a group to organize individual tasks into a larger experiment.
        """
        self._job_type = job_type

        if group is not None:
            try:
                self._fold_id = int(group)
            except ValueError:
                self._fold_id = group

        # Overwrites current pl_logger if any
        self._pl_logger = None

        if self._task is None:
            self.init_task()

    def init_task(self):
        """Reinit ``Task``."""
        from clearml import Task
        from clearml import TaskTypes

        auto_connect_frameworks = {
            "tensorboard": True,  # for DL models that use pytorch lightning
            "joblib": True,  # for backtest with multiple jobs
        }
        if isinstance(self.auto_connect_frameworks, Mapping):
            auto_connect_frameworks = {**auto_connect_frameworks, **self.auto_connect_frameworks}

        self._task = Task.init(
            project_name=self.project_name,
            task_name=self.task_name,
            task_type=TaskTypes[self.task_type],
            tags=self.tags,
            output_uri=self.output_uri,
            auto_connect_frameworks=auto_connect_frameworks,
            auto_resource_monitoring=self.auto_resource_monitoring,
            auto_connect_streams=self.auto_connect_streams,
            reuse_last_task_id=False,
        )
        if self.config is not None:
            self._task.connect(mutable=self.config)

    def finish_experiment(self, *args, **kwargs):
        """Finish ``Task``."""
        # flush all data for additionally spawned tasks
        if (self._task is not None) and (not self._task.is_main_task()):
            self._task.flush(wait_for_uploads=True)

        self._job_type = None
        self._fold_id = None
        self._pl_logger = None

    def _get_logger(self):
        """Return internal task logger."""
        if self._task is None:
            raise ValueError("ClearML task is not initialized!")
        return self._task.current_task().get_logger()

    @property
    def pl_logger(self):
        """Pytorch lightning logger."""
        if self._pl_logger is None:
            from pytorch_lightning.loggers import TensorBoardLogger

            prefix = "" if self._fold_id is None else f"Fold-{self._fold_id}"
            self._pl_logger = TensorBoardLogger(
                save_dir=self.save_dir, name=self.task_name, prefix=prefix, version=prefix
            )

        return self._pl_logger
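Putting the new logger to work end to end, a hedged sketch (the CSV path, project name, and parameter values are placeholders; ``Pipeline.backtest`` is what drives the ``start_experiment`` / ``log_backtest_run`` / ``log_backtest_metrics`` calls defined above):

import pandas as pd

from etna.datasets import TSDataset
from etna.loggers import ClearMLLogger
from etna.loggers import tslogger
from etna.metrics import MAE
from etna.models import NaiveModel
from etna.pipeline import Pipeline

tslogger.add(ClearMLLogger(project_name="etna-demo", tags=["backtest"]))  # hypothetical project

df = pd.read_csv("example_dataset.csv")  # placeholder: long format with timestamp, segment, target
ts = TSDataset(TSDataset.to_dataset(df), freq="D")

pipeline = Pipeline(model=NaiveModel(lag=1), horizon=7)
# each fold triggers log_backtest_run; the aggregate goes through log_backtest_metrics
backtest_result = pipeline.backtest(ts=ts, metrics=[MAE()], n_folds=3)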
2 changes: 1 addition & 1 deletion etna/models/sarimax.py
@@ -406,7 +406,7 @@ def forecast_components(self, df: pd.DataFrame) -> pd.DataFrame:
        state = forecast_results.predicted_state[:, :-1]

        if model.mle_regression:
-            # If there are no exog variales `mle_regression` will be set to `False`
+            # If there are no exog variables `mle_regression` will be set to `False`
            # even if user set to `True`.
            components = self._mle_regression_decomposition(
                state=state, ssm=forecast_results.model, exog=exog_future.values  # type: ignore