DataDesigner/tests/engine/test_configurable_task.py
Johnny Greco 3d9f5185d7
refactor: remove task metadata property (#216)
* remove metadata

* docs and tests

* don't need that test

* use static method for generation strategy

* update docs

* add docstring
2026-01-15 14:12:11 -05:00

124 lines
4.5 KiB
Python

# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# SPDX-License-Identifier: Apache-2.0
from unittest.mock import Mock
import pandas as pd
import pytest
from data_designer.config.base import ConfigBase
from data_designer.engine.configurable_task import ConfigurableTask, DataT, TaskConfigT
from data_designer.engine.dataset_builders.artifact_storage import ArtifactStorage
from data_designer.engine.models.registry import ModelRegistry
from data_designer.engine.resources.resource_provider import ResourceProvider
def test_configurable_task_generic_type_variables() -> None:
assert DataT.__constraints__ == (dict, pd.DataFrame)
assert TaskConfigT.__bound__ == ConfigBase
def test_configurable_task_concrete_implementation() -> None:
class TestConfig(ConfigBase):
value: str
class TestTask(ConfigurableTask[TestConfig]):
@classmethod
def get_config_type(cls) -> type[TestConfig]:
return TestConfig
def _validate(self) -> None:
pass
def _initialize(self) -> None:
pass
config = TestConfig(value="test")
mock_artifact_storage = Mock(spec=ArtifactStorage)
mock_artifact_storage.dataset_name = "test_dataset"
mock_artifact_storage.final_dataset_folder_name = "final_dataset"
mock_artifact_storage.partial_results_folder_name = "partial_results"
mock_artifact_storage.dropped_columns_folder_name = "dropped_columns"
mock_artifact_storage.processors_outputs_folder_name = "processors_outputs"
resource_provider = ResourceProvider(artifact_storage=mock_artifact_storage)
task = TestTask(config=config, resource_provider=resource_provider)
assert task._config == config
assert task._resource_provider == resource_provider
def test_configurable_task_config_validation() -> None:
class TestConfig(ConfigBase):
value: str
class TestTask(ConfigurableTask[TestConfig]):
@classmethod
def get_config_type(cls) -> type[TestConfig]:
return TestConfig
def _validate(self) -> None:
if self._config.value == "invalid":
raise ValueError("Invalid config")
config = TestConfig(value="test")
mock_artifact_storage = Mock(spec=ArtifactStorage)
mock_artifact_storage.dataset_name = "test_dataset"
mock_artifact_storage.final_dataset_folder_name = "final_dataset"
mock_artifact_storage.partial_results_folder_name = "partial_results"
mock_artifact_storage.dropped_columns_folder_name = "dropped_columns"
mock_artifact_storage.processors_outputs_folder_name = "processors_outputs"
resource_provider = ResourceProvider(artifact_storage=mock_artifact_storage)
task = TestTask(config=config, resource_provider=resource_provider)
assert task._config.value == "test"
invalid_config = TestConfig(value="invalid")
with pytest.raises(ValueError, match="Invalid config"):
TestTask(config=invalid_config, resource_provider=resource_provider)
def test_configurable_task_resource_validation() -> None:
class TestConfig(ConfigBase):
value: str
class TestTask(ConfigurableTask[TestConfig]):
@classmethod
def get_config_type(cls) -> type[TestConfig]:
return TestConfig
def _validate(self) -> None:
pass
def _initialize(self) -> None:
pass
config = TestConfig(value="test")
mock_artifact_storage = Mock(spec=ArtifactStorage)
mock_artifact_storage.dataset_name = "test_dataset"
mock_artifact_storage.final_dataset_folder_name = "final_dataset"
mock_artifact_storage.partial_results_folder_name = "partial_results"
mock_artifact_storage.dropped_columns_folder_name = "dropped_columns"
mock_artifact_storage.processors_outputs_folder_name = "processors_outputs"
mock_model_registry = Mock(spec=ModelRegistry)
resource_provider = ResourceProvider(artifact_storage=mock_artifact_storage, model_registry=mock_model_registry)
task = TestTask(config=config, resource_provider=resource_provider)
assert task._resource_provider == resource_provider
def test_configurable_task_resource_provider_is_none() -> None:
class TestConfig(ConfigBase):
value: str
class TestTask(ConfigurableTask[TestConfig]):
def _validate(self) -> None:
pass
def _initialize(self) -> None:
pass
config = TestConfig(value="test")
task = TestTask(config=config, resource_provider=None)
assert task._resource_provider is None