From 95dfae4fa006703584c1181b52d6e2d32c91d932 Mon Sep 17 00:00:00 2001 From: Maxime Armstrong Date: Thu, 19 Dec 2024 19:33:22 -0500 Subject: [PATCH 1/9] [dagster-powerbi] Implement copy_with_context in DagsterPowerBITranslator --- .../dagster_powerbi/resource.py | 2 +- .../dagster_powerbi/translator.py | 41 ++++++++++- .../dagster_powerbi_tests/test_translator.py | 70 +++++++++++++++++++ 3 files changed, 111 insertions(+), 2 deletions(-) diff --git a/python_modules/libraries/dagster-powerbi/dagster_powerbi/resource.py b/python_modules/libraries/dagster-powerbi/dagster_powerbi/resource.py index 246f699b223dd..4627233bf4ff3 100644 --- a/python_modules/libraries/dagster-powerbi/dagster_powerbi/resource.py +++ b/python_modules/libraries/dagster-powerbi/dagster_powerbi/resource.py @@ -437,7 +437,7 @@ def fetch_state(self) -> PowerBIWorkspaceData: ) def defs_from_state(self, state: PowerBIWorkspaceData) -> Definitions: - translator = self.translator_cls(context=state) + translator = self.translator_cls().copy_with_context(context=state) all_external_data = [ *state.dashboards_by_id.values(), diff --git a/python_modules/libraries/dagster-powerbi/dagster_powerbi/translator.py b/python_modules/libraries/dagster-powerbi/dagster_powerbi/translator.py index 01e6b0ef5ac74..7e5816586d543 100644 --- a/python_modules/libraries/dagster-powerbi/dagster_powerbi/translator.py +++ b/python_modules/libraries/dagster-powerbi/dagster_powerbi/translator.py @@ -1,9 +1,11 @@ +import inspect import re import urllib.parse from enum import Enum from typing import Any, Dict, List, Literal, Optional, Sequence from dagster import ( + DagsterInvariantViolationError, UrlMetadataValue, _check as check, ) @@ -155,9 +157,46 @@ class DagsterPowerBITranslator: Subclass this class to implement custom logic for each type of PowerBI content. """ - def __init__(self, context: PowerBIWorkspaceData): + def __init__(self, context: Optional[PowerBIWorkspaceData] = None): + if type(self).__init__ is not DagsterPowerBITranslator.__init__ and "context" not in set( + inspect.getfullargspec(type(self).__init__).args + ): + raise DagsterInvariantViolationError( + f"Invalid custom `__init__` function in custom translator class {type(self)}. " + f"The custom `__init__` function must include " + f"the parameter `context` of type `Optional[PowerBIWorkspaceData]` with default `None`." + ) self._context = context + def get_init_kwargs_from_instance(self): + _vars = vars(self) + _params = set(inspect.getfullargspec(self.__init__).args) + + # self.__init__ will always include self as a parameter + _params.remove("self") + + kwargs = {} + for param in _params: + private_param = f"_{param}" + if param not in _vars and private_param not in _vars: + raise KeyError( + f"Could not find __init__ param {param} or it's private counterpart {private_param} " + f"in the attributes {_vars} of translator {self}. " + f"Make sure that your __init__ parameters matches the attributes of your translator." + ) + kwargs[param] = _vars.get(param) or _vars.get(private_param) + return kwargs + + def copy_with_context(self, context: PowerBIWorkspaceData): + kwargs = self.get_init_kwargs_from_instance() + if kwargs.get("context"): + raise DagsterInvariantViolationError( + f"The context already exist on this translator instance {self}. " + "Cannot create a new translator instance with new context." + ) + kwargs["context"] = context + return self.__class__(**kwargs) + @property def workspace_data(self) -> PowerBIWorkspaceData: return self._context diff --git a/python_modules/libraries/dagster-powerbi/dagster_powerbi_tests/test_translator.py b/python_modules/libraries/dagster-powerbi/dagster_powerbi_tests/test_translator.py index cb43e33c7f00a..af49182f66cf0 100644 --- a/python_modules/libraries/dagster-powerbi/dagster_powerbi_tests/test_translator.py +++ b/python_modules/libraries/dagster-powerbi/dagster_powerbi_tests/test_translator.py @@ -1,8 +1,12 @@ +from typing import Optional + +import pytest from dagster._core.definitions.asset_key import AssetKey from dagster._core.definitions.asset_spec import AssetSpec from dagster._core.definitions.metadata.metadata_value import MetadataValue from dagster._core.definitions.metadata.table import TableColumn, TableSchema from dagster._core.definitions.tags import build_kind_tag +from dagster._core.errors import DagsterInvariantViolationError from dagster_powerbi import DagsterPowerBITranslator from dagster_powerbi.translator import PowerBIContentData, PowerBIContentType, PowerBIWorkspaceData @@ -136,6 +140,72 @@ def test_translator_custom_metadata(workspace_data: PowerBIWorkspaceData) -> Non assert asset_spec.key.path == ["prefix", "dashboard", "Sales_Returns_Sample_v201912"] +class MyCustomTranslatorWithInitParam(DagsterPowerBITranslator): + def __init__(self, my_param: str, context: Optional[PowerBIWorkspaceData] = None): + self.my_param = my_param + super().__init__(context=context) + + def get_asset_spec(self, data: PowerBIContentData) -> AssetSpec: + default_spec = super().get_asset_spec(data) + return default_spec.replace_attributes( + key=default_spec.key.with_prefix("prefix"), + metadata={**default_spec.metadata, "custom": self.my_param}, + ) + + +def test_custom_translator_with_init_param(workspace_data: PowerBIWorkspaceData) -> None: + dashboard = next(iter(workspace_data.dashboards_by_id.values())) + + test_param = "test" + translator = MyCustomTranslatorWithInitParam(my_param=test_param).copy_with_context( + context=workspace_data + ) + asset_spec = translator.get_asset_spec(dashboard) + + assert "custom" in asset_spec.metadata + assert asset_spec.metadata["custom"] == test_param + assert asset_spec.key.path == ["prefix", "dashboard", "Sales_Returns_Sample_v201912"] + + +def test_custom_translator_with_existing_context(workspace_data: PowerBIWorkspaceData) -> None: + translator = MyCustomTranslatorWithInitParam(my_param="test", context=workspace_data) + with pytest.raises( + DagsterInvariantViolationError, + match="The context already exist on this translator instance", + ): + translator.copy_with_context(context=workspace_data) + + +class MyCustomTranslatorWithInvalidInitParam(DagsterPowerBITranslator): + def __init__(self, my_param: str): + self.my_param = my_param + super().__init__() + + +def test_custom_translator_with_invalid_init_param(workspace_data: PowerBIWorkspaceData) -> None: + with pytest.raises( + DagsterInvariantViolationError, + match="Invalid custom `__init__` function in custom translator class", + ): + MyCustomTranslatorWithInvalidInitParam(my_param="test") + + +class MyCustomTranslatorWithInvalidAttribute(DagsterPowerBITranslator): + def __init__(self, my_param: str, context: Optional[PowerBIWorkspaceData] = None): + self.another_param_name = my_param + super().__init__(context=context) + + +def test_custom_translator_with_invalid_attribute(workspace_data: PowerBIWorkspaceData) -> None: + with pytest.raises( + KeyError, + match="Could not find __init__ param", + ): + MyCustomTranslatorWithInvalidAttribute(my_param="test").copy_with_context( + context=workspace_data + ) + + def test_translator_report_spec_no_dataset(workspace_data: PowerBIWorkspaceData) -> None: report_no_dataset = PowerBIContentData( content_type=PowerBIContentType.REPORT, From f29bcb970514c3cafb01a7c2a800193e84ac72cd Mon Sep 17 00:00:00 2001 From: Maxime Armstrong Date: Thu, 19 Dec 2024 19:36:33 -0500 Subject: [PATCH 2/9] Use brackets to access context --- .../libraries/dagster-powerbi/dagster_powerbi/translator.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/python_modules/libraries/dagster-powerbi/dagster_powerbi/translator.py b/python_modules/libraries/dagster-powerbi/dagster_powerbi/translator.py index 7e5816586d543..4287937d0c190 100644 --- a/python_modules/libraries/dagster-powerbi/dagster_powerbi/translator.py +++ b/python_modules/libraries/dagster-powerbi/dagster_powerbi/translator.py @@ -189,7 +189,7 @@ def get_init_kwargs_from_instance(self): def copy_with_context(self, context: PowerBIWorkspaceData): kwargs = self.get_init_kwargs_from_instance() - if kwargs.get("context"): + if kwargs["context"]: raise DagsterInvariantViolationError( f"The context already exist on this translator instance {self}. " "Cannot create a new translator instance with new context." From f057496bda4934b7ac0dc3100b26bdd990b45ec9 Mon Sep 17 00:00:00 2001 From: Maxime Armstrong Date: Thu, 19 Dec 2024 19:38:56 -0500 Subject: [PATCH 3/9] Update exception --- .../libraries/dagster-powerbi/dagster_powerbi/translator.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/python_modules/libraries/dagster-powerbi/dagster_powerbi/translator.py b/python_modules/libraries/dagster-powerbi/dagster_powerbi/translator.py index 4287937d0c190..ec827f0d637e2 100644 --- a/python_modules/libraries/dagster-powerbi/dagster_powerbi/translator.py +++ b/python_modules/libraries/dagster-powerbi/dagster_powerbi/translator.py @@ -180,9 +180,9 @@ def get_init_kwargs_from_instance(self): private_param = f"_{param}" if param not in _vars and private_param not in _vars: raise KeyError( - f"Could not find __init__ param {param} or it's private counterpart {private_param} " + f"Could not find `__init__` param {param} or it's private counterpart {private_param} " f"in the attributes {_vars} of translator {self}. " - f"Make sure that your __init__ parameters matches the attributes of your translator." + f"Make sure that your `__init__` parameters matches the attributes of your translator." ) kwargs[param] = _vars.get(param) or _vars.get(private_param) return kwargs From 94e5c0453f875760905348803d073f607117945f Mon Sep 17 00:00:00 2001 From: Maxime Armstrong Date: Thu, 19 Dec 2024 19:55:16 -0500 Subject: [PATCH 4/9] Update test --- .../dagster-powerbi/dagster_powerbi_tests/test_translator.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/python_modules/libraries/dagster-powerbi/dagster_powerbi_tests/test_translator.py b/python_modules/libraries/dagster-powerbi/dagster_powerbi_tests/test_translator.py index af49182f66cf0..8796b3766479a 100644 --- a/python_modules/libraries/dagster-powerbi/dagster_powerbi_tests/test_translator.py +++ b/python_modules/libraries/dagster-powerbi/dagster_powerbi_tests/test_translator.py @@ -199,7 +199,7 @@ def __init__(self, my_param: str, context: Optional[PowerBIWorkspaceData] = None def test_custom_translator_with_invalid_attribute(workspace_data: PowerBIWorkspaceData) -> None: with pytest.raises( KeyError, - match="Could not find __init__ param", + match="Could not find `__init__` param", ): MyCustomTranslatorWithInvalidAttribute(my_param="test").copy_with_context( context=workspace_data From 882b2bf95f621f44ee94c53c0fe06416406b5dc2 Mon Sep 17 00:00:00 2001 From: Maxime Armstrong Date: Thu, 19 Dec 2024 19:56:26 -0500 Subject: [PATCH 5/9] Create properties for conditions --- .../dagster-powerbi/dagster_powerbi/translator.py | 14 +++++++++++--- .../dagster_powerbi_tests/test_translator.py | 2 +- 2 files changed, 12 insertions(+), 4 deletions(-) diff --git a/python_modules/libraries/dagster-powerbi/dagster_powerbi/translator.py b/python_modules/libraries/dagster-powerbi/dagster_powerbi/translator.py index ec827f0d637e2..d33572b8edeb1 100644 --- a/python_modules/libraries/dagster-powerbi/dagster_powerbi/translator.py +++ b/python_modules/libraries/dagster-powerbi/dagster_powerbi/translator.py @@ -158,9 +158,7 @@ class DagsterPowerBITranslator: """ def __init__(self, context: Optional[PowerBIWorkspaceData] = None): - if type(self).__init__ is not DagsterPowerBITranslator.__init__ and "context" not in set( - inspect.getfullargspec(type(self).__init__).args - ): + if self._has_custom_init_function and not self._has_context_param_in_init_function: raise DagsterInvariantViolationError( f"Invalid custom `__init__` function in custom translator class {type(self)}. " f"The custom `__init__` function must include " @@ -197,6 +195,16 @@ def copy_with_context(self, context: PowerBIWorkspaceData): kwargs["context"] = context return self.__class__(**kwargs) + @property + def _has_custom_init_function(self) -> bool: + return type(self).__init__ is not DagsterPowerBITranslator.__init__ + + @property + def _has_context_param_in_init_function(self) -> bool: + return "context" in set( + inspect.getfullargspec(type(self).__init__).args + ) + @property def workspace_data(self) -> PowerBIWorkspaceData: return self._context diff --git a/python_modules/libraries/dagster-powerbi/dagster_powerbi_tests/test_translator.py b/python_modules/libraries/dagster-powerbi/dagster_powerbi_tests/test_translator.py index 8796b3766479a..4acfbd3f3536d 100644 --- a/python_modules/libraries/dagster-powerbi/dagster_powerbi_tests/test_translator.py +++ b/python_modules/libraries/dagster-powerbi/dagster_powerbi_tests/test_translator.py @@ -199,7 +199,7 @@ def __init__(self, my_param: str, context: Optional[PowerBIWorkspaceData] = None def test_custom_translator_with_invalid_attribute(workspace_data: PowerBIWorkspaceData) -> None: with pytest.raises( KeyError, - match="Could not find `__init__` param", + match="Could not find `__init__ param", ): MyCustomTranslatorWithInvalidAttribute(my_param="test").copy_with_context( context=workspace_data From 2019b5d0003e930036ebfb9853717d7794b4c809 Mon Sep 17 00:00:00 2001 From: Maxime Armstrong Date: Thu, 19 Dec 2024 20:01:25 -0500 Subject: [PATCH 6/9] Update test --- .../dagster-powerbi/dagster_powerbi_tests/test_translator.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/python_modules/libraries/dagster-powerbi/dagster_powerbi_tests/test_translator.py b/python_modules/libraries/dagster-powerbi/dagster_powerbi_tests/test_translator.py index 4acfbd3f3536d..8796b3766479a 100644 --- a/python_modules/libraries/dagster-powerbi/dagster_powerbi_tests/test_translator.py +++ b/python_modules/libraries/dagster-powerbi/dagster_powerbi_tests/test_translator.py @@ -199,7 +199,7 @@ def __init__(self, my_param: str, context: Optional[PowerBIWorkspaceData] = None def test_custom_translator_with_invalid_attribute(workspace_data: PowerBIWorkspaceData) -> None: with pytest.raises( KeyError, - match="Could not find `__init__ param", + match="Could not find `__init__` param", ): MyCustomTranslatorWithInvalidAttribute(my_param="test").copy_with_context( context=workspace_data From 0307489ae75acc9d244af16464c8ae8b616bd9a9 Mon Sep 17 00:00:00 2001 From: Maxime Armstrong Date: Thu, 19 Dec 2024 20:05:15 -0500 Subject: [PATCH 7/9] Fix pyright --- .../libraries/dagster-powerbi/dagster_powerbi/translator.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/python_modules/libraries/dagster-powerbi/dagster_powerbi/translator.py b/python_modules/libraries/dagster-powerbi/dagster_powerbi/translator.py index d33572b8edeb1..888ec031201e0 100644 --- a/python_modules/libraries/dagster-powerbi/dagster_powerbi/translator.py +++ b/python_modules/libraries/dagster-powerbi/dagster_powerbi/translator.py @@ -207,7 +207,7 @@ def _has_context_param_in_init_function(self) -> bool: @property def workspace_data(self) -> PowerBIWorkspaceData: - return self._context + return check.not_none(self._context) def get_asset_spec(self, data: PowerBIContentData) -> AssetSpec: if data.content_type == PowerBIContentType.DASHBOARD: From 62c78aebf8d466bd894f4b6aed6f4e3b9bf50ff7 Mon Sep 17 00:00:00 2001 From: Maxime Armstrong Date: Thu, 19 Dec 2024 20:07:15 -0500 Subject: [PATCH 8/9] Make get init kwargs private --- .../libraries/dagster-powerbi/dagster_powerbi/translator.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/python_modules/libraries/dagster-powerbi/dagster_powerbi/translator.py b/python_modules/libraries/dagster-powerbi/dagster_powerbi/translator.py index 888ec031201e0..ccf773d53f4cd 100644 --- a/python_modules/libraries/dagster-powerbi/dagster_powerbi/translator.py +++ b/python_modules/libraries/dagster-powerbi/dagster_powerbi/translator.py @@ -166,7 +166,7 @@ def __init__(self, context: Optional[PowerBIWorkspaceData] = None): ) self._context = context - def get_init_kwargs_from_instance(self): + def _get_init_kwargs_from_instance(self): _vars = vars(self) _params = set(inspect.getfullargspec(self.__init__).args) @@ -186,7 +186,7 @@ def get_init_kwargs_from_instance(self): return kwargs def copy_with_context(self, context: PowerBIWorkspaceData): - kwargs = self.get_init_kwargs_from_instance() + kwargs = self._get_init_kwargs_from_instance() if kwargs["context"]: raise DagsterInvariantViolationError( f"The context already exist on this translator instance {self}. " From 8cd5486f7977c79229f22c3dc6ad5d33795c46cc Mon Sep 17 00:00:00 2001 From: Maxime Armstrong Date: Thu, 19 Dec 2024 20:07:35 -0500 Subject: [PATCH 9/9] Lint --- .../libraries/dagster-powerbi/dagster_powerbi/translator.py | 4 +--- 1 file changed, 1 insertion(+), 3 deletions(-) diff --git a/python_modules/libraries/dagster-powerbi/dagster_powerbi/translator.py b/python_modules/libraries/dagster-powerbi/dagster_powerbi/translator.py index ccf773d53f4cd..203c1e81baf01 100644 --- a/python_modules/libraries/dagster-powerbi/dagster_powerbi/translator.py +++ b/python_modules/libraries/dagster-powerbi/dagster_powerbi/translator.py @@ -201,9 +201,7 @@ def _has_custom_init_function(self) -> bool: @property def _has_context_param_in_init_function(self) -> bool: - return "context" in set( - inspect.getfullargspec(type(self).__init__).args - ) + return "context" in set(inspect.getfullargspec(type(self).__init__).args) @property def workspace_data(self) -> PowerBIWorkspaceData: