forked from Galileo-Galilei/kedro-mlflow

Commit 8861950
FIX Galileo-Galilei#9 MlflowMetricsDataSet implemented.
Adrian Piotr Kruszewski committed Aug 24, 2020
1 parent: 379b617
Showing 6 changed files with 391 additions and 1 deletion.
@@ -1,3 +1,62 @@
# Version metrics

- This is coming soon. If you want to keep track of the progress on this feature, [follow this issue](https://github.com/Galileo-Galilei/kedro-mlflow/issues/9).
## What is metric tracking?

MLflow defines metrics as "Key-value metrics, where the value is numeric. Each metric can be updated throughout the course of the run (for example, to track how your model’s loss function is converging), and MLflow records and lets you visualize the metric’s full history".
## How to version metrics in a kedro project?

kedro-mlflow introduces a new ``AbstractDataSet`` called ``MlflowMetricsDataSet``. It is a wrapper around a dictionary of metrics returned by a node, and it logs those metrics to MLflow.

Since it is an ``AbstractDataSet``, it can be used with the YAML API. You can define it as:
```yaml
my_model_metrics:
  type: kedro_mlflow.io.MlflowMetricsDataSet
```
It also accepts a ``prefix`` configuration option. This is especially useful when your pipeline evaluates metrics on different datasets. For example:
```yaml
my_model_metrics_dev:
  type: kedro_mlflow.io.MlflowMetricsDataSet
  prefix: dev
my_model_metrics_test:
  type: kedro_mlflow.io.MlflowMetricsDataSet
  prefix: test
```
In that scenario, metrics will be available in MLflow under the given prefixes. For example, the ``accuracy`` metric from the example above will be stored under the key ``test.accuracy`` for ``my_model_metrics_test``, and under ``dev.accuracy`` for ``my_model_metrics_dev``.
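As a minimal sketch of this naming rule (using a hypothetical `prefixed_key` helper, not part of the library):

```python
from typing import Optional

def prefixed_key(key: str, prefix: Optional[str] = None) -> str:
    """Join an optional dataset prefix to a metric key with a dot."""
    return f"{prefix}.{key}" if prefix else key

# The same node output lands under different MLflow keys per catalog entry:
print(prefixed_key("accuracy", "test"))  # test.accuracy
print(prefixed_key("accuracy", "dev"))   # dev.accuracy
print(prefixed_key("accuracy"))          # accuracy
```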
## How to return metrics from a node?

Assume you have a node with no inputs that returns a dictionary of metrics to log:
```python
from typing import Dict, List, Union

def metrics_node() -> Dict[str, Union[float, List[float]]]:
    return {
        "metric1": 1.0,
        "metric2": [1.0, 1.1],
    }
```
As you can see above, ``kedro_mlflow.io.MlflowMetricsDataSet`` accepts metrics either as ``float`` values or as ``list``s of ``float``s. In the first case, a single value is logged under the given metric key; in the second, a series of values is logged.
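To make the two shapes concrete, here is a standalone sketch (not the library's internal code) of how such a dictionary can be flattened into MLflow-style `(key, value, step)` triples, with list entries enumerated as successive steps:

```python
from typing import Dict, List, Tuple, Union

MetricItem = Union[float, List[float]]

def flatten_metrics(data: Dict[str, MetricItem]) -> List[Tuple[str, float, int]]:
    """Expand a metrics dict into (key, value, step) triples."""
    triples: List[Tuple[str, float, int]] = []
    for key, value in data.items():
        if isinstance(value, float):
            triples.append((key, value, 0))  # single value, logged at step 0
        else:
            # a list becomes a series: one point per step
            triples.extend((key, v, i) for i, v in enumerate(value))
    return triples

print(flatten_metrics({"metric1": 1.0, "metric2": [1.0, 1.1]}))
# [('metric1', 1.0, 0), ('metric2', 1.0, 0), ('metric2', 1.1, 1)]
```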

To store the metrics, we need to define a metrics dataset in the Kedro catalog:

```yaml
my_model_metrics:
  type: kedro_mlflow.io.MlflowMetricsDataSet
```
To complete the example, we also need a pipeline that uses this node and stores its metrics under the ``my_model_metrics`` name:
```python
from kedro.pipeline import Pipeline, node

def create_pipeline() -> Pipeline:
    return Pipeline(
        [
            node(
                func=metrics_node,
                inputs=None,
                outputs="my_model_metrics",
                name="log_metrics",
            )
        ]
    )
```
@@ -1 +1,2 @@
from .mlflow_dataset import MlflowDataSet
from .mlflow_metrics_dataset import MlflowMetricsDataSet
@@ -0,0 +1,178 @@
from copy import deepcopy
from functools import partial, reduce
from itertools import chain
from typing import Any, Dict, Generator, List, Optional, Tuple, Union

import mlflow
from kedro.io import AbstractDataSet, DataSetError
from mlflow.tracking import MlflowClient

MetricItem = Union[float, List[float], Dict[str, float], List[Dict[str, float]]]
MetricTuple = Tuple[str, float, int]
MetricsDict = Dict[str, MetricItem]

class MlflowMetricsDataSet(AbstractDataSet):
    """This class represents an MLflow metrics dataset."""

    def __init__(
        self,
        run_id: Optional[str] = None,
        prefix: Optional[str] = None,
    ):
        """Initialise MlflowMetricsDataSet.

        Args:
            run_id (Optional[str]): ID of the MLflow run.
            prefix (Optional[str]): Prefix for metrics logged in MLflow.
        """
        self._prefix = prefix
        self._run_id = run_id

    def _load(self) -> MetricsDict:
        """Load the MlflowMetricsDataSet.

        Returns:
            MetricsDict: Dictionary with the MLflow metrics dataset.
        """
        client = MlflowClient()
        run_id = self._get_run_id()
        all_metrics = client._tracking_client.store.get_all_metrics(run_uuid=run_id)
        dataset_metrics = filter(self._is_dataset_metric, all_metrics)
        dataset = reduce(
            lambda xs, x: self._update_metric(
                # get_all_metrics returns only the last saved value per metric key.
                # All values are required here, so fetch the full history.
                client.get_metric_history(run_id, x.key),
                xs,
            ),
            dataset_metrics,
            {},
        )
        return dataset

    def _save(self, data: MetricsDict) -> None:
        """Save the given MLflow metrics dataset and log it in MLflow as metrics.

        Args:
            data (MetricsDict): MLflow metrics dataset.
        """
        client = MlflowClient()
        try:
            run_id = self._get_run_id()
        except DataSetError:
            # If run_id can't be found, log_metric will create a new run.
            run_id = None

        log_metric = (
            partial(client.log_metric, run_id)
            if run_id is not None
            else mlflow.log_metric
        )
        metrics = (
            self._build_args_list_from_metric_item(k, v) for k, v in data.items()
        )
        for k, v, i in chain.from_iterable(metrics):
            log_metric(k, v, step=i)

    def _exists(self) -> bool:
        """Check if the MLflow metrics dataset exists.

        Returns:
            bool: True if the MLflow metrics dataset exists.
        """
        client = MlflowClient()
        run_id = self._get_run_id()
        all_metrics = client._tracking_client.store.get_all_metrics(run_uuid=run_id)
        return any(self._is_dataset_metric(x) for x in all_metrics)

    def _describe(self) -> Dict[str, Any]:
        """Describe the MLflow metrics dataset.

        Returns:
            Dict[str, Any]: Dictionary with the MLflow metrics dataset description.
        """
        return {
            "prefix": self._prefix,
        }

    def _get_run_id(self) -> str:
        """Get the run id.

        Returns the run id passed at initialisation if any; otherwise the id of
        the active run. Raises a `DataSetError` if neither can be found.

        Returns:
            str: String containing the run_id.
        """
        if self._run_id is not None:
            return self._run_id
        run = mlflow.active_run()
        if run:
            return run.info.run_id
        raise DataSetError("Cannot find run id.")

    def _is_dataset_metric(self, metric: mlflow.entities.Metric) -> bool:
        """Check if the given metric belongs to this dataset.

        Args:
            metric (mlflow.entities.Metric): MLflow metric instance.
        """
        return self._prefix is None or (
            self._prefix and metric.key.startswith(self._prefix)
        )

    @staticmethod
    def _update_metric(
        metrics: List[mlflow.entities.Metric], dataset: Optional[MetricsDict] = None
    ) -> MetricsDict:
        """Update the given dataset with the given metrics.

        Args:
            metrics (List[mlflow.entities.Metric]): List of MLflow metric objects.
            dataset (Optional[MetricsDict]): Dictionary containing the MLflow
                metrics dataset; a new one is created if not given.

        Returns:
            MetricsDict: Dictionary with the MLflow metrics dataset.
        """
        # Avoid a mutable default argument, which would be shared across calls.
        dataset = {} if dataset is None else dataset
        for metric in metrics:
            metric_dict = {"step": metric.step, "value": metric.value}
            if metric.key in dataset:
                if isinstance(dataset[metric.key], list):
                    dataset[metric.key].append(metric_dict)
                else:
                    dataset[metric.key] = [dataset[metric.key], metric_dict]
            else:
                dataset[metric.key] = metric_dict
        return dataset

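The accumulation rule of `_update_metric` can be sketched with plain dicts standing in for `mlflow.entities.Metric` objects (hypothetical `merge_history` helper, for illustration only):

```python
def merge_history(history, dataset):
    """Fold a metric's history into the dataset: one dict for a single
    point, a list of dicts once a key has more than one point."""
    for point in history:  # each point: {"key": ..., "step": ..., "value": ...}
        entry = {"step": point["step"], "value": point["value"]}
        if point["key"] in dataset:
            if isinstance(dataset[point["key"]], list):
                dataset[point["key"]].append(entry)
            else:
                # promote a single entry to a list on the second point
                dataset[point["key"]] = [dataset[point["key"]], entry]
        else:
            dataset[point["key"]] = entry
    return dataset

history = [
    {"key": "loss", "step": 0, "value": 1.0},
    {"key": "loss", "step": 1, "value": 0.5},
]
print(merge_history(history, {}))
# {'loss': [{'step': 0, 'value': 1.0}, {'step': 1, 'value': 0.5}]}
```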
    def _build_args_list_from_metric_item(
        self, key: str, value: MetricItem
    ) -> Generator[MetricTuple, None, None]:
        """Build a generator of tuples with metrics.

        The first element of each tuple is the key, the second the metric
        value, the third the step. If the MLflow metrics dataset has a prefix,
        it is attached to the key.

        Args:
            key (str): Metric key.
            value (MetricItem): Metric value.

        Returns:
            Generator[MetricTuple, None, None]: Generator yielding metrics as tuples.
        """
        if self._prefix:
            key = f"{self._prefix}.{key}"
        if isinstance(value, float):
            return (i for i in [(key, value, 0)])
        if isinstance(value, dict):
            return (i for i in [(key, value["value"], value["step"])])
        if isinstance(value, list) and len(value) > 0:
            if isinstance(value[0], dict):
                return ((key, x["value"], x["step"]) for x in value)
            return ((key, v, i) for i, v in enumerate(value))
        raise DataSetError(
            f"Unexpected metric value. Should be of type `{MetricItem}`, got {type(value)}"
        )
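For reference, the four accepted value shapes map to tuples as follows. This is a standalone sketch mirroring the branching above (a hypothetical `to_tuples` function, returning lists instead of generators for readability):

```python
def to_tuples(key, value, prefix=None):
    """Map a metric value (float, dict, or list thereof) to (key, value, step) tuples."""
    if prefix:
        key = f"{prefix}.{key}"
    if isinstance(value, float):
        return [(key, value, 0)]
    if isinstance(value, dict):
        return [(key, value["value"], value["step"])]
    if isinstance(value, list) and value:
        if isinstance(value[0], dict):
            return [(key, x["value"], x["step"]) for x in value]
        return [(key, v, i) for i, v in enumerate(value)]
    raise ValueError(f"Unexpected metric value: {type(value)}")

print(to_tuples("f1", {"value": 0.9, "step": 3}, prefix="test"))
# [('test.f1', 0.9, 3)]
print(to_tuples("loss", [0.5, 0.25]))
# [('loss', 0.5, 0), ('loss', 0.25, 1)]
```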