Inherit tags from nodes for modular pipelines #1878

Merged: 21 commits, May 7, 2024
3 changes: 3 additions & 0 deletions package/kedro_viz/data_access/managers.py
@@ -199,6 +199,9 @@ def add_pipeline(self, registered_pipeline_id: str, pipeline: KedroPipeline):
modular_pipelines.add_output(
current_modular_pipeline_id, output_node
)
# add tags
if current_modular_pipeline_id is not None:
modular_pipelines.add_tags(current_modular_pipeline_id, task_node.tags)

def add_node(self, registered_pipeline_id: str, node: KedroNode) -> TaskNode:
"""Add a Kedro node as a TaskNode to the NodesRepository
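The diff above wires tag inheritance into add_pipeline: while iterating over a pipeline's task nodes, each node's tags are unioned into its enclosing modular pipeline. A minimal self-contained sketch of that mechanic (the ModularPipeline dataclass and tree dict here are simplified stand-ins, not the actual kedro-viz types):

```python
from dataclasses import dataclass, field


@dataclass
class ModularPipeline:
    # Simplified stand-in for kedro-viz's modular pipeline node.
    id: str
    tags: set = field(default_factory=set)


tree = {"uk.data_processing": ModularPipeline("uk.data_processing")}


def add_tags(modular_pipeline_id: str, node_tags: set) -> None:
    # Mirrors ModularPipelinesRepository.add_tags: union the node's tags
    # into the pipeline's tag set, but only if the pipeline is in the tree.
    if modular_pipeline_id in tree:
        tree[modular_pipeline_id].tags |= node_tags


add_tags("uk.data_processing", {"split"})
add_tags("uk.data_processing", {"train"})
add_tags("missing.pipeline", {"ignored"})  # silently skipped, as in the guard above
print(sorted(tree["uk.data_processing"].tags))  # ['split', 'train']
```

The `if current_modular_pipeline_id is not None` check in the diff plays the same role as the tree-membership guard here: nodes outside any namespace contribute no tags.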
22 changes: 22 additions & 0 deletions package/kedro_viz/data_access/repositories/modular_pipelines.py
@@ -1,5 +1,6 @@
"""`kedro_viz.data_access.repositories.modular_pipelines`
defines repository to centralise access to modular pipelines data."""

from typing import Dict, Optional, Union

from kedro_viz.constants import ROOT_MODULAR_PIPELINE_ID
@@ -161,6 +162,27 @@ def add_output(self, modular_pipeline_id: str, output_node: GraphNode):
else:
self.tree[modular_pipeline_id].external_outputs.add(output_node.id)

def add_tags(self, modular_pipeline_id: str, node_tags: set):
Contributor:
I was going through the modular pipelines code and found that we update the modular pipeline's pipelines set with node.pipelines. Maybe we can update the tags at that point too.

For example, at line 239 in this file, inside the extract_from_node function, we could have something like modular_pipeline.tags.update(node.tags). In that case we would not need this function, and would also not need the call at line 203 in managers.py. What do you think? @rashidakanchwala

Contributor:

That's how I believe @jitu5 approached it previously.
He had some code in the extract_from_node function, which I found very confusing because the function was originally defined to extract namespaces, but now it was also gathering tags.
I think it's important to have clean functions that each handle one task, rather than one function doing too many things.

I'm also personally confused by the extract_from_node function being called three times here - link to GitHub code.
This is exactly the code refactor/simplification that Ivan mentioned to us the other day.

Contributor:

I agree with having clean functions. If you look at our add_pipeline function, it does all of the tasks below:

  1. Populates the RegisteredPipelinesRepository
  2. Populates the ModularPipelinesRepository
  3. Populates the GraphNodesRepository
  4. Apart from the above, it also creates the TaskNode and DataNode and assigns inputs/outputs to the created nodes

Now, if we also update the tags of the created modular pipeline there, we are adding a bit of logic that belongs only to modular pipelines to an add_pipeline function that is already complex.

Yes, extract_from_node also does more than just extract the namespace; it does the tasks below, but everything there belongs to the modular pipeline:

  1. Creates the modular pipeline
  2. Updates its pipelines set with the node's pipelines
  3. Adds the node as a child of the created modular pipeline

We should probably rename it to something like add_modular_pipeline. The reason I feel the modular pipeline's tags should be updated in that place is that this is where we create the modular pipeline from the node's namespace and update its required attributes/properties. It is fine to have add_tags as a separate function that updates the tags set (not recursively, though, as @jitu5 did initially) and call it from extract_from_node.

Also, I feel having clean functions is also about grouping tasks that belong to a particular area (in this case, modular pipelines). We did this when adding resolve_dataset_factory_patterns, which resolves dataset patterns in the catalog. Since that belongs to the catalog, we added it inside add_catalog. Again, add_catalog does more than just add the catalog: it also adds tracking datasets (another function to refactor 🗡️).

Thank you

"""
Add tags to a modular pipeline.

Args:
modular_pipeline_id: ID of the modular pipeline to add the tags to.
node_tags: The tags to add to the modular pipeline.

Example:
>>> modular_pipelines = ModularPipelinesRepository()
>>> node_tags = {"tag1", "tag2"}
>>> modular_pipelines.add_tags("data_science", node_tags)
>>> data_science_pipeline = modular_pipelines.get_or_create_modular_pipeline(
... "data_science"
... )
>>> assert "tag1" in data_science_pipeline.tags
>>> assert "tag2" in data_science_pipeline.tags
"""
if modular_pipeline_id in self.tree:
self.tree[modular_pipeline_id].tags |= node_tags

def add_child(self, modular_pipeline_id: str, child: ModularPipelineChild):
"""Add a child to a modular pipeline.
Args:
Expand Down
2 changes: 2 additions & 0 deletions package/kedro_viz/services/modular_pipelines.py
@@ -1,6 +1,7 @@
"""`kedro_viz.services.modular_pipelines` defines modular pipelines-related business logic.
The service layer consist of pure functions operating on domain models.
"""

from typing import Dict

from kedro_viz.constants import ROOT_MODULAR_PIPELINE_ID
@@ -78,6 +79,7 @@ def expand_tree(
)

expanded_tree[parent_id].pipelines.update(modular_pipeline_node.pipelines)
expanded_tree[parent_id].tags.update(modular_pipeline_node.tags)
expanded_tree[parent_id].children.add(
ModularPipelineChild(
id=f"{parent_id}.{chunks[i]}",
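The one-line change above makes expand_tree propagate tags to ancestor pipelines, which is why the "uk" pipeline in the test expectations ends up with both "split" and "train". A minimal sketch of that propagation (a standalone helper, not the actual expand_tree signature):

```python
def propagate_tags(namespace: str, tags: set, tree: dict) -> None:
    # A nested namespace like "uk.data_science" is split into chunks, and
    # every ancestor id ("uk", "uk.data_science") accumulates the tags.
    chunks = namespace.split(".")
    for i in range(len(chunks)):
        parent_id = ".".join(chunks[: i + 1])
        tree.setdefault(parent_id, set()).update(tags)


tree: dict = {}
propagate_tags("uk.data_processing", {"split"}, tree)
propagate_tags("uk.data_science", {"train"}, tree)
print(sorted(tree["uk"]))  # ['split', 'train']
```

Each leaf keeps only its own tags, while shared ancestors collect the union, matching the expected API responses in the test diff below.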
10 changes: 5 additions & 5 deletions package/tests/test_api/test_rest/test_responses.py
@@ -184,7 +184,7 @@ def assert_example_data(response_data):
{
"id": "uk.data_processing",
"name": "uk.data_processing",
"tags": [],
"tags": ["split"],
"pipelines": ["__default__"],
"type": "modularPipeline",
"modular_pipelines": None,
@@ -195,7 +195,7 @@
{
"id": "uk.data_science",
"name": "uk.data_science",
"tags": [],
"tags": ["train"],
"pipelines": ["__default__"],
"type": "modularPipeline",
"modular_pipelines": None,
@@ -206,7 +206,7 @@
{
"id": "uk",
"name": "uk",
"tags": [],
"tags": ["split", "train"],
"pipelines": ["__default__"],
"type": "modularPipeline",
"modular_pipelines": None,
@@ -731,7 +731,7 @@ def test_get_pipeline(self, client):
{
"id": "uk",
"name": "uk",
"tags": [],
"tags": ["train"],
"pipelines": ["data_science"],
"type": "modularPipeline",
"modular_pipelines": None,
@@ -742,7 +742,7 @@
{
"id": "uk.data_science",
"name": "uk.data_science",
"tags": [],
"tags": ["train"],
"pipelines": ["data_science"],
"type": "modularPipeline",
"modular_pipelines": None,
@@ -83,3 +83,14 @@ def test_add_output_should_raise_if_adding_non_data_node(self, identity):
modular_pipelines = ModularPipelinesRepository()
with pytest.raises(ValueError):
modular_pipelines.add_output("data_science", task_node)

def test_add_tags(self):
modular_pipelines = ModularPipelinesRepository()
node_tags = {"tag1", "tag2"}
modular_pipelines.get_or_create_modular_pipeline("data_science")
modular_pipelines.add_tags("data_science", node_tags)
data_science_pipeline = modular_pipelines.get_or_create_modular_pipeline(
"data_science"
)
assert "tag1" in data_science_pipeline.tags
assert "tag2" in data_science_pipeline.tags